Source code

Revision control

Copy as Markdown

Other Tools

/* -*- Mode: C++; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 2 -*-
* vim: set ts=8 sts=2 et sw=2 tw=80:
*
* Copyright 2015 Mozilla Foundation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "wasm/WasmTypeDef.h"
#include "mozilla/MathAlgorithms.h"
#include "jit/JitOptions.h"
#include "js/friend/ErrorMessages.h" // JSMSG_*
#include "js/HashTable.h"
#include "js/Printf.h"
#include "js/Value.h"
#include "threading/ExclusiveData.h"
#include "vm/Runtime.h"
#include "vm/StringType.h"
#include "wasm/WasmCodegenConstants.h"
#include "wasm/WasmGcObject.h"
#include "wasm/WasmJS.h"
using namespace js;
using namespace js::jit;
using namespace js::wasm;
using mozilla::CheckedInt32;
using mozilla::CheckedUint32;
using mozilla::IsPowerOfTwo;
using mozilla::MallocSizeOf;
// [SMDOC] Immediate type signature encoding
//
// call_indirect requires a signature check to ensure the dynamic callee type
// matches the static specified callee type. This involves comparing whether
// the two function types are equal. We canonicalize function types so that
// comparing the pointers of the types will indicate if they're equal. The
// canonicalized function types are loaded from the instance at runtime.
//
// For the common case of simple/small function types, we can avoid the cost
// of loading the function type pointers from the instance by having an
// alternate 'immediate' form that encodes a function type in a constant.
// We encode the function types such that bitwise equality implies the original
// function types were equal. We use a tag bit such that if one of the types
// is a pointer and the other an immediate, they will not compare as equal.
//
// The encoding is optimized for common function types that have at most one
// result and an arbitrary amount of arguments.
//
// [
// 1 bit : tag (always 1),
// 1 bit : numResults,
// 3 bits : numArgs,
// numResults * 3 bits : results,
// numArgs * 3 bits : args
// ]
// (lsb -> msb order)
//
// Any function type that cannot be encoded in the above format is falls back
// to the pointer representation.
//
//=========================================================================
// ImmediateType
// ImmediateType is 32-bits to ensure it's easy to materialize the constant
// on all platforms.
using ImmediateType = uint32_t;
static const unsigned sTotalBits = sizeof(ImmediateType) * 8;
static const unsigned sTagBits = 1;
static const unsigned sNumResultsBits = 1;
static const unsigned sNumArgsBits = 3;
static const unsigned sValTypeBits = 3;
static const unsigned sMaxValTypes = 8;
static_assert(((1 << sNumResultsBits) - 1) + ((1 << sNumArgsBits) - 1) ==
sMaxValTypes,
"sNumResultsBits, sNumArgsBits, sMaxValTypes are consistent");
static_assert(sTagBits + sNumResultsBits + sNumArgsBits +
sValTypeBits * sMaxValTypes <=
sTotalBits,
"have room");
static bool IsImmediateValType(ValType vt) {
switch (vt.kind()) {
case ValType::I32:
case ValType::I64:
case ValType::F32:
case ValType::F64:
case ValType::V128:
return true;
case ValType::Ref:
// We don't have space to encode nullability, so we optimize for
// non-nullable types.
if (!vt.isNullable()) {
return false;
}
switch (vt.refType().kind()) {
case RefType::Func:
case RefType::Extern:
case RefType::Any:
return true;
default:
return false;
}
default:
return false;
}
}
static unsigned EncodeImmediateValType(ValType vt) {
// We have run out of bits for each type, anything new must increase the
// sValTypeBits.
static_assert(7 < (1 << sValTypeBits), "enough space for ValType kind");
switch (vt.kind()) {
case ValType::I32:
return 0;
case ValType::I64:
return 1;
case ValType::F32:
return 2;
case ValType::F64:
return 3;
case ValType::V128:
return 4;
case ValType::Ref:
MOZ_ASSERT(vt.isNullable());
switch (vt.refType().kind()) {
case RefType::Func:
return 5;
case RefType::Extern:
return 6;
case RefType::Any:
return 7;
default:
MOZ_CRASH("bad RefType");
}
default:
MOZ_CRASH("bad ValType");
}
}
static bool IsImmediateFuncType(const FuncType& funcType) {
const ValTypeVector& results = funcType.results();
const ValTypeVector& args = funcType.args();
// Check the number of results and args fits
if (results.length() > ((1 << sNumResultsBits) - 1) ||
args.length() > ((1 << sNumArgsBits) - 1)) {
return false;
}
// Ensure every result is compatible
for (ValType v : results) {
if (!IsImmediateValType(v)) {
return false;
}
}
// Ensure every arg is compatible
for (ValType v : args) {
if (!IsImmediateValType(v)) {
return false;
}
}
return true;
}
static ImmediateType EncodeNumResults(uint32_t numResults) {
MOZ_ASSERT(numResults <= (1 << sNumResultsBits) - 1);
return numResults;
}
static ImmediateType EncodeNumArgs(uint32_t numArgs) {
MOZ_ASSERT(numArgs <= (1 << sNumArgsBits) - 1);
return numArgs;
}
static ImmediateType EncodeImmediateFuncType(const FuncType& funcType) {
ImmediateType immediate = FuncType::ImmediateBit;
uint32_t shift = sTagBits;
// Encode the results
immediate |= EncodeNumResults(funcType.results().length()) << shift;
shift += sNumResultsBits;
for (ValType resultType : funcType.results()) {
immediate |= EncodeImmediateValType(resultType) << shift;
shift += sValTypeBits;
}
// Encode the args
immediate |= EncodeNumArgs(funcType.args().length()) << shift;
shift += sNumArgsBits;
for (ValType argType : funcType.args()) {
immediate |= EncodeImmediateValType(argType) << shift;
shift += sValTypeBits;
}
MOZ_ASSERT(shift <= sTotalBits);
return immediate;
}
//=========================================================================
// FuncType
void FuncType::initImmediateTypeId(bool gcEnabled, bool isFinal,
const TypeDef* superTypeDef,
uint32_t recGroupLength) {
// To improve the performance of the structural type check in
// the call_indirect function prologue, we attempt to encode the
// entire function type into an immediate such that bitwise equality
// implies structural equality. With the GC proposal, we don't
// want to generalize the immediate form for the new type system, so
// we don't use it when a type is non-final (i.e. may have sub types), or
// has super types, or is in a recursion group with other types.
//
// If non-final types are allowed, then the type can have subtypes, and we
// should therefore do a full subtype check on call_indirect, which
// doesn't work well with immediates. If the type has a super type, the
// same reason applies. And finally, types in recursion groups of
// size > 1 may not be considered equivalent even if they are
// structurally equivalent in every respect.
if (gcEnabled && (!isFinal || superTypeDef || recGroupLength != 1)) {
immediateTypeId_ = NO_IMMEDIATE_TYPE_ID;
return;
}
// Otherwise, try to encode this function type into an immediate.
if (!IsImmediateFuncType(*this)) {
immediateTypeId_ = NO_IMMEDIATE_TYPE_ID;
return;
}
immediateTypeId_ = EncodeImmediateFuncType(*this);
}
bool FuncType::canHaveJitEntry() const {
return !hasUnexposableArgOrRet() &&
!temporarilyUnsupportedReftypeForEntry() &&
!temporarilyUnsupportedResultCountForJitEntry() &&
JitOptions.enableWasmJitEntry;
}
bool FuncType::canHaveJitExit() const {
return !hasUnexposableArgOrRet() && !temporarilyUnsupportedReftypeForExit() &&
!hasInt64Arg() && !temporarilyUnsupportedResultCountForJitExit() &&
JitOptions.enableWasmJitExit;
}
size_t FuncType::sizeOfExcludingThis(MallocSizeOf mallocSizeOf) const {
return args_.sizeOfExcludingThis(mallocSizeOf);
}
//=========================================================================
// StructType and StructLayout
static inline CheckedInt32 RoundUpToAlignment(CheckedInt32 address,
uint32_t align) {
MOZ_ASSERT(IsPowerOfTwo(align));
// Note: Be careful to order operators such that we first make the
// value smaller and then larger, so that we don't get false
// overflow errors due to (e.g.) adding `align` and then
// subtracting `1` afterwards when merely adding `align-1` would
// not have overflowed. Note that due to the nature of two's
// complement representation, if `address` is already aligned,
// then adding `align-1` cannot itself cause an overflow.
return ((address + (align - 1)) / align) * align;
}
CheckedInt32 StructLayout::addField(StorageType type) {
uint32_t fieldSize = type.size();
uint32_t fieldAlignment = type.alignmentInStruct();
// We have to ensure that `offset` is chosen so that no field crosses the
// inline/outline boundary. The assertions here ensure that. See comment
// on `class StructLayout` for background.
MOZ_ASSERT(fieldSize >= 1 && fieldSize <= 16);
MOZ_ASSERT((fieldSize & (fieldSize - 1)) == 0); // is a power of 2
MOZ_ASSERT(fieldAlignment == fieldSize); // is naturally aligned
// Alignment of the struct is the max of the alignment of its fields.
structAlignment = std::max(structAlignment, fieldAlignment);
// Align the pointer.
CheckedInt32 offset = RoundUpToAlignment(sizeSoFar, fieldAlignment);
if (!offset.isValid()) {
return offset;
}
// Allocate space.
sizeSoFar = offset + fieldSize;
if (!sizeSoFar.isValid()) {
return sizeSoFar;
}
// The following should hold if the three assertions above hold.
MOZ_ASSERT(offset / 16 == (offset + fieldSize - 1) / 16);
return offset;
}
CheckedInt32 StructLayout::close() {
CheckedInt32 size = RoundUpToAlignment(sizeSoFar, structAlignment);
// What we are computing into `size` is the size of
// WasmGcObject::inlineData_, or the size of the outline data area. Either
// way, it is helpful if the area size is an integral number of machine
// words, since this would make any initialisation loop for inline
// allocation able to operate on machine word sized units, should we decide
// to do inline allocation.
if (structAlignment < sizeof(uintptr_t)) {
size = RoundUpToAlignment(size, sizeof(uintptr_t));
}
return size;
}
bool StructType::init() {
StructLayout layout;
for (FieldType& field : fields_) {
CheckedInt32 offset = layout.addField(field.type);
if (!offset.isValid()) {
return false;
}
if (!fieldOffsets_.append(offset.value())) {
return false;
}
if (!field.type.isRefRepr()) {
continue;
}
bool isOutline;
uint32_t adjustedOffset;
WasmStructObject::fieldOffsetToAreaAndOffset(field.type, offset.value(),
&isOutline, &adjustedOffset);
if (isOutline) {
if (!outlineTraceOffsets_.append(adjustedOffset)) {
return false;
}
} else {
if (!inlineTraceOffsets_.append(adjustedOffset)) {
return false;
}
}
}
CheckedInt32 size = layout.close();
if (!size.isValid()) {
return false;
}
size_ = size.value();
return true;
}
/* static */
bool StructType::createImmutable(const ValTypeVector& types,
StructType* struct_) {
FieldTypeVector fields;
if (!fields.resize(types.length())) {
return false;
}
for (size_t i = 0; i < types.length(); i++) {
fields[i].type = StorageType(types[i].packed());
fields[i].isMutable = false;
}
*struct_ = StructType(std::move(fields));
return struct_->init();
}
size_t StructType::sizeOfExcludingThis(MallocSizeOf mallocSizeOf) const {
return fields_.sizeOfExcludingThis(mallocSizeOf);
}
size_t ArrayType::sizeOfExcludingThis(MallocSizeOf mallocSizeOf) const {
return 0;
}
size_t TypeDef::sizeOfExcludingThis(MallocSizeOf mallocSizeOf) const {
switch (kind_) {
case TypeDefKind::Struct: {
return structType_.sizeOfExcludingThis(mallocSizeOf);
}
case TypeDefKind::Func: {
return funcType_.sizeOfExcludingThis(mallocSizeOf);
}
case TypeDefKind::Array: {
return arrayType_.sizeOfExcludingThis(mallocSizeOf);
}
case TypeDefKind::None: {
return 0;
}
default:
break;
}
MOZ_ASSERT_UNREACHABLE();
return 0;
}
//=========================================================================
// SuperTypeVector
/* static */
size_t SuperTypeVector::offsetOfSTVInVector(uint32_t subTypingDepth) {
return offsetof(SuperTypeVector, types_) + sizeof(void*) * subTypingDepth;
}
/* static */
size_t SuperTypeVector::lengthForTypeDef(const TypeDef& typeDef) {
return std::max(uint32_t(typeDef.subTypingDepth()) + 1,
MinSuperTypeVectorLength);
}
/* static */
size_t SuperTypeVector::byteSizeForTypeDef(const TypeDef& typeDef) {
static_assert(
sizeof(SuperTypeVector) + sizeof(void*) * (MaxSubTypingDepth + 1) <=
UINT16_MAX,
"cannot overflow");
return sizeof(SuperTypeVector) + (sizeof(void*) * lengthForTypeDef(typeDef));
}
/* static */
const SuperTypeVector* SuperTypeVector::createMultipleForRecGroup(
RecGroup* recGroup) {
// Pre-size the amount of space needed for all the super type vectors in this
// recursion group.
CheckedUint32 totalBytes = 0;
for (uint32_t typeIndex = 0; typeIndex < recGroup->numTypes(); typeIndex++) {
totalBytes +=
SuperTypeVector::byteSizeForTypeDef(recGroup->type(typeIndex));
}
if (!totalBytes.isValid()) {
return nullptr;
}
// Allocate the batch, and retain reference to the first one.
SuperTypeVector* firstVector =
(SuperTypeVector*)js_malloc(totalBytes.value());
if (!firstVector) {
return nullptr;
}
// Initialize the vectors, one by one
SuperTypeVector* currentVector = firstVector;
for (uint32_t typeIndex = 0; typeIndex < recGroup->numTypes(); typeIndex++) {
TypeDef& typeDef = recGroup->type(typeIndex);
// Compute the size again to know where the next vector can be found.
size_t vectorByteSize = SuperTypeVector::byteSizeForTypeDef(typeDef);
// Make the typedef and the vector point at each other.
typeDef.setSuperTypeVector(currentVector);
currentVector->typeDef_ = &typeDef;
currentVector->subTypingDepth_ = typeDef.subTypingDepth();
// Every vector stores all ancestor types and itself.
currentVector->length_ = SuperTypeVector::lengthForTypeDef(typeDef);
// Initialize the entries in the vector
const TypeDef* currentTypeDef = &typeDef;
for (uint32_t index = 0; index < currentVector->length(); index++) {
uint32_t reverseIndex = currentVector->length() - index - 1;
// If this entry is required just to hit the minimum size, then
// initialize it to null.
if (reverseIndex > typeDef.subTypingDepth()) {
currentVector->types_[reverseIndex] = nullptr;
continue;
}
// Otherwise we should always be iterating at the same depth as our
// currentTypeDef.
MOZ_ASSERT(reverseIndex == currentTypeDef->subTypingDepth());
currentVector->types_[reverseIndex] = currentTypeDef->superTypeVector();
currentTypeDef = currentTypeDef->superTypeDef();
}
// There should be no more super types left over
MOZ_ASSERT(currentTypeDef == nullptr);
// Advance to the next super type vector
currentVector =
(SuperTypeVector*)(((const char*)currentVector) + vectorByteSize);
}
return firstVector;
}
//=========================================================================
// TypeIdSet and TypeContext
struct RecGroupHashPolicy {
using Lookup = const SharedRecGroup&;
static HashNumber hash(Lookup lookup) { return lookup->hash(); }
static bool match(const SharedRecGroup& lhs, Lookup rhs) {
return RecGroup::matches(*rhs, *lhs);
}
};
// A global hash set of recursion groups for use in fast type equality checks.
class TypeIdSet {
using Set = HashSet<SharedRecGroup, RecGroupHashPolicy, SystemAllocPolicy>;
Set set_;
public:
// Attempt to insert a recursion group into the set, returning an existing
// recursion group if there was one.
SharedRecGroup insert(SharedRecGroup recGroup) {
Set::AddPtr p = set_.lookupForAdd(recGroup);
if (p) {
// A canonical recursion group already existed, return it.
return *p;
}
// Insert this recursion group into the set, and return it as the canonical
// recursion group instance.
if (!set_.add(p, recGroup)) {
return nullptr;
}
return recGroup;
}
void purge() {
// TODO: this is not guaranteed to remove all types that are not referenced
// from outside the canonical set, as removing a type may make a previous
// type we've visited now only have one ref and be eligible to be freed.
//
// Solving this either involves iterating to a fixed point, or else a much
// more invasive change to the lifetime management of recursion groups.
for (auto iter = set_.modIter(); !iter.done(); iter.next()) {
if (iter.get()->hasOneRef()) {
iter.remove();
}
}
}
// Release the provided recursion group reference and remove it from the
// canonical set if it was the last reference. This is one unified method
// because we need to perform the lookup before releasing the reference, but
// need to release the reference in order to see if it was the last reference
// outside the canonical set.
void clearRecGroup(SharedRecGroup* recGroupCell) {
if (Set::Ptr p = set_.lookup(*recGroupCell)) {
*recGroupCell = nullptr;
if ((*p)->hasOneRef()) {
set_.remove(p);
}
} else {
*recGroupCell = nullptr;
}
}
};
ExclusiveData<TypeIdSet> typeIdSet(mutexid::WasmTypeIdSet);
void wasm::PurgeCanonicalTypes() {
ExclusiveData<TypeIdSet>::Guard locked = typeIdSet.lock();
locked->purge();
}
SharedRecGroup TypeContext::canonicalizeGroup(SharedRecGroup recGroup) {
ExclusiveData<TypeIdSet>::Guard locked = typeIdSet.lock();
return locked->insert(recGroup);
}
TypeContext::~TypeContext() {
ExclusiveData<TypeIdSet>::Guard locked = typeIdSet.lock();
// Clear out the recursion groups in this module, freeing them from the
// canonical type set if needed.
//
// We iterate backwards here so that we free every previous recursion group
// that may be referring to the current recursion group we're freeing. This
// is possible due to recursion groups being ordered.
for (int32_t groupIndex = recGroups_.length() - 1; groupIndex >= 0;
groupIndex--) {
// Try to remove this entry from the canonical set if we have the last
// strong reference. The entry may not exist if canonicalization failed
// and this type context was aborted. This will clear the reference in the
// vector.
locked->clearRecGroup(&recGroups_[groupIndex]);
}
}