3aa862896b
Review URL: https://codereview.chromium.org/1485823003 Cr-Commit-Position: refs/heads/master@{#32535}
375 lines
11 KiB
C++
375 lines
11 KiB
C++
// Copyright 2014 the V8 project authors. All rights reserved.
|
|
// Redistribution and use in source and binary forms, with or without
|
|
// modification, are permitted provided that the following conditions are
|
|
// met:
|
|
//
|
|
// * Redistributions of source code must retain the above copyright
|
|
// notice, this list of conditions and the following disclaimer.
|
|
// * Redistributions in binary form must reproduce the above
|
|
// copyright notice, this list of conditions and the following
|
|
// disclaimer in the documentation and/or other materials provided
|
|
// with the distribution.
|
|
// * Neither the name of Google Inc. nor the names of its
|
|
// contributors may be used to endorse or promote products derived
|
|
// from this software without specific prior written permission.
|
|
//
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
#ifndef V8_AST_AST_VALUE_FACTORY_H_
|
|
#define V8_AST_AST_VALUE_FACTORY_H_
|
|
|
|
#include "src/api.h"
|
|
#include "src/hashmap.h"
|
|
#include "src/utils.h"
|
|
|
|
// AstString, AstValue and AstValueFactory are for storing strings and values
|
|
// independent of the V8 heap and internalizing them later. During parsing,
|
|
// AstStrings and AstValues are created and stored outside the heap, in
|
|
// AstValueFactory. After parsing, the strings and values are internalized
|
|
// (moved into the V8 heap).
|
|
namespace v8 {
|
|
namespace internal {
|
|
|
|
class AstString : public ZoneObject {
|
|
public:
|
|
virtual ~AstString() {}
|
|
|
|
virtual int length() const = 0;
|
|
bool IsEmpty() const { return length() == 0; }
|
|
|
|
// Puts the string into the V8 heap.
|
|
virtual void Internalize(Isolate* isolate) = 0;
|
|
|
|
// This function can be called after internalizing.
|
|
V8_INLINE Handle<String> string() const {
|
|
DCHECK(!string_.is_null());
|
|
return string_;
|
|
}
|
|
|
|
protected:
|
|
// This is null until the string is internalized.
|
|
Handle<String> string_;
|
|
};
|
|
|
|
|
|
class AstRawString : public AstString {
|
|
public:
|
|
int length() const override {
|
|
if (is_one_byte_)
|
|
return literal_bytes_.length();
|
|
return literal_bytes_.length() / 2;
|
|
}
|
|
|
|
int byte_length() const { return literal_bytes_.length(); }
|
|
|
|
void Internalize(Isolate* isolate) override;
|
|
|
|
bool AsArrayIndex(uint32_t* index) const;
|
|
|
|
// The string is not null-terminated, use length() to find out the length.
|
|
const unsigned char* raw_data() const {
|
|
return literal_bytes_.start();
|
|
}
|
|
bool is_one_byte() const { return is_one_byte_; }
|
|
bool IsOneByteEqualTo(const char* data) const;
|
|
uint16_t FirstCharacter() const {
|
|
if (is_one_byte_)
|
|
return literal_bytes_[0];
|
|
const uint16_t* c =
|
|
reinterpret_cast<const uint16_t*>(literal_bytes_.start());
|
|
return *c;
|
|
}
|
|
|
|
// For storing AstRawStrings in a hash map.
|
|
uint32_t hash() const {
|
|
return hash_;
|
|
}
|
|
|
|
private:
|
|
friend class AstValueFactory;
|
|
friend class AstRawStringInternalizationKey;
|
|
|
|
AstRawString(bool is_one_byte, const Vector<const byte>& literal_bytes,
|
|
uint32_t hash)
|
|
: is_one_byte_(is_one_byte), literal_bytes_(literal_bytes), hash_(hash) {}
|
|
|
|
AstRawString()
|
|
: is_one_byte_(true),
|
|
hash_(0) {}
|
|
|
|
bool is_one_byte_;
|
|
|
|
// Points to memory owned by Zone.
|
|
Vector<const byte> literal_bytes_;
|
|
uint32_t hash_;
|
|
};
|
|
|
|
|
|
class AstConsString : public AstString {
|
|
public:
|
|
AstConsString(const AstString* left, const AstString* right)
|
|
: left_(left),
|
|
right_(right) {}
|
|
|
|
int length() const override { return left_->length() + right_->length(); }
|
|
|
|
void Internalize(Isolate* isolate) override;
|
|
|
|
private:
|
|
friend class AstValueFactory;
|
|
|
|
const AstString* left_;
|
|
const AstString* right_;
|
|
};
|
|
|
|
|
|
// AstValue is either a string, a number, a string array, a boolean, or a
|
|
// special value (null, undefined, the hole).
|
|
class AstValue : public ZoneObject {
|
|
public:
|
|
bool IsString() const {
|
|
return type_ == STRING;
|
|
}
|
|
|
|
bool IsNumber() const {
|
|
return type_ == NUMBER || type_ == NUMBER_WITH_DOT || type_ == SMI;
|
|
}
|
|
|
|
bool ContainsDot() const { return type_ == NUMBER_WITH_DOT; }
|
|
|
|
const AstRawString* AsString() const {
|
|
if (type_ == STRING)
|
|
return string_;
|
|
UNREACHABLE();
|
|
return 0;
|
|
}
|
|
|
|
double AsNumber() const {
|
|
if (type_ == NUMBER || type_ == NUMBER_WITH_DOT)
|
|
return number_;
|
|
if (type_ == SMI)
|
|
return smi_;
|
|
UNREACHABLE();
|
|
return 0;
|
|
}
|
|
|
|
bool EqualsString(const AstRawString* string) const {
|
|
return type_ == STRING && string_ == string;
|
|
}
|
|
|
|
bool IsPropertyName() const;
|
|
|
|
bool BooleanValue() const;
|
|
|
|
bool IsTheHole() const { return type_ == THE_HOLE; }
|
|
|
|
void Internalize(Isolate* isolate);
|
|
|
|
// Can be called after Internalize has been called.
|
|
V8_INLINE Handle<Object> value() const {
|
|
if (type_ == STRING) {
|
|
return string_->string();
|
|
}
|
|
DCHECK(!value_.is_null());
|
|
return value_;
|
|
}
|
|
|
|
private:
|
|
friend class AstValueFactory;
|
|
|
|
enum Type {
|
|
STRING,
|
|
SYMBOL,
|
|
NUMBER,
|
|
NUMBER_WITH_DOT,
|
|
SMI,
|
|
BOOLEAN,
|
|
NULL_TYPE,
|
|
UNDEFINED,
|
|
THE_HOLE
|
|
};
|
|
|
|
explicit AstValue(const AstRawString* s) : type_(STRING) { string_ = s; }
|
|
|
|
explicit AstValue(const char* name) : type_(SYMBOL) { symbol_name_ = name; }
|
|
|
|
explicit AstValue(double n, bool with_dot) {
|
|
if (with_dot) {
|
|
type_ = NUMBER_WITH_DOT;
|
|
} else {
|
|
type_ = NUMBER;
|
|
}
|
|
number_ = n;
|
|
}
|
|
|
|
AstValue(Type t, int i) : type_(t) {
|
|
DCHECK(type_ == SMI);
|
|
smi_ = i;
|
|
}
|
|
|
|
explicit AstValue(bool b) : type_(BOOLEAN) { bool_ = b; }
|
|
|
|
explicit AstValue(Type t) : type_(t) {
|
|
DCHECK(t == NULL_TYPE || t == UNDEFINED || t == THE_HOLE);
|
|
}
|
|
|
|
Type type_;
|
|
|
|
// Uninternalized value.
|
|
union {
|
|
const AstRawString* string_;
|
|
double number_;
|
|
int smi_;
|
|
bool bool_;
|
|
ZoneList<const AstRawString*>* strings_;
|
|
const char* symbol_name_;
|
|
};
|
|
|
|
// Internalized value (empty before internalized).
|
|
Handle<Object> value_;
|
|
};
|
|
|
|
|
|
// For generating constants.
|
|
#define STRING_CONSTANTS(F) \
|
|
F(anonymous_function, "(anonymous function)") \
|
|
F(arguments, "arguments") \
|
|
F(constructor, "constructor") \
|
|
F(default, "default") \
|
|
F(done, "done") \
|
|
F(dot, ".") \
|
|
F(dot_for, ".for") \
|
|
F(dot_generator, ".generator") \
|
|
F(dot_generator_object, ".generator_object") \
|
|
F(dot_iterator, ".iterator") \
|
|
F(dot_result, ".result") \
|
|
F(dot_switch_tag, ".switch_tag") \
|
|
F(dot_catch, ".catch") \
|
|
F(empty, "") \
|
|
F(eval, "eval") \
|
|
F(let, "let") \
|
|
F(native, "native") \
|
|
F(new_target, ".new.target") \
|
|
F(next, "next") \
|
|
F(proto, "__proto__") \
|
|
F(prototype, "prototype") \
|
|
F(this, "this") \
|
|
F(this_function, ".this_function") \
|
|
F(undefined, "undefined") \
|
|
F(use_asm, "use asm") \
|
|
F(use_strong, "use strong") \
|
|
F(use_strict, "use strict") \
|
|
F(value, "value")
|
|
|
|
#define OTHER_CONSTANTS(F) \
|
|
F(true_value) \
|
|
F(false_value) \
|
|
F(null_value) \
|
|
F(undefined_value) \
|
|
F(the_hole_value)
|
|
|
|
class AstValueFactory {
|
|
public:
|
|
AstValueFactory(Zone* zone, uint32_t hash_seed)
|
|
: string_table_(AstRawStringCompare),
|
|
zone_(zone),
|
|
isolate_(NULL),
|
|
hash_seed_(hash_seed) {
|
|
#define F(name, str) name##_string_ = NULL;
|
|
STRING_CONSTANTS(F)
|
|
#undef F
|
|
#define F(name) name##_ = NULL;
|
|
OTHER_CONSTANTS(F)
|
|
#undef F
|
|
}
|
|
|
|
Zone* zone() const { return zone_; }
|
|
|
|
const AstRawString* GetOneByteString(Vector<const uint8_t> literal) {
|
|
return GetOneByteStringInternal(literal);
|
|
}
|
|
const AstRawString* GetOneByteString(const char* string) {
|
|
return GetOneByteString(Vector<const uint8_t>(
|
|
reinterpret_cast<const uint8_t*>(string), StrLength(string)));
|
|
}
|
|
const AstRawString* GetTwoByteString(Vector<const uint16_t> literal) {
|
|
return GetTwoByteStringInternal(literal);
|
|
}
|
|
const AstRawString* GetString(Handle<String> literal);
|
|
const AstConsString* NewConsString(const AstString* left,
|
|
const AstString* right);
|
|
|
|
void Internalize(Isolate* isolate);
|
|
bool IsInternalized() {
|
|
return isolate_ != NULL;
|
|
}
|
|
|
|
#define F(name, str) \
|
|
const AstRawString* name##_string() { \
|
|
if (name##_string_ == NULL) { \
|
|
const char* data = str; \
|
|
name##_string_ = GetOneByteString( \
|
|
Vector<const uint8_t>(reinterpret_cast<const uint8_t*>(data), \
|
|
static_cast<int>(strlen(data)))); \
|
|
} \
|
|
return name##_string_; \
|
|
}
|
|
STRING_CONSTANTS(F)
|
|
#undef F
|
|
|
|
const AstValue* NewString(const AstRawString* string);
|
|
// A JavaScript symbol (ECMA-262 edition 6).
|
|
const AstValue* NewSymbol(const char* name);
|
|
const AstValue* NewNumber(double number, bool with_dot = false);
|
|
const AstValue* NewSmi(int number);
|
|
const AstValue* NewBoolean(bool b);
|
|
const AstValue* NewStringList(ZoneList<const AstRawString*>* strings);
|
|
const AstValue* NewNull();
|
|
const AstValue* NewUndefined();
|
|
const AstValue* NewTheHole();
|
|
|
|
private:
|
|
AstRawString* GetOneByteStringInternal(Vector<const uint8_t> literal);
|
|
AstRawString* GetTwoByteStringInternal(Vector<const uint16_t> literal);
|
|
AstRawString* GetString(uint32_t hash, bool is_one_byte,
|
|
Vector<const byte> literal_bytes);
|
|
|
|
static bool AstRawStringCompare(void* a, void* b);
|
|
|
|
// All strings are copied here, one after another (no NULLs inbetween).
|
|
HashMap string_table_;
|
|
// For keeping track of all AstValues and AstRawStrings we've created (so that
|
|
// they can be internalized later).
|
|
List<AstValue*> values_;
|
|
List<AstString*> strings_;
|
|
Zone* zone_;
|
|
Isolate* isolate_;
|
|
|
|
uint32_t hash_seed_;
|
|
|
|
#define F(name, str) const AstRawString* name##_string_;
|
|
STRING_CONSTANTS(F)
|
|
#undef F
|
|
|
|
#define F(name) AstValue* name##_;
|
|
OTHER_CONSTANTS(F)
|
|
#undef F
|
|
};
|
|
} // namespace internal
|
|
} // namespace v8
|
|
|
|
#undef STRING_CONSTANTS
|
|
#undef OTHER_CONSTANTS
|
|
|
|
#endif // V8_AST_AST_VALUE_FACTORY_H_
|