// Copyright 2015 the V8 project authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef V8_WASM_MODULE_H_ #define V8_WASM_MODULE_H_ #include <memory> #include "src/api.h" #include "src/globals.h" #include "src/handles.h" #include "src/parsing/preparse-data.h" #include "src/wasm/managed.h" #include "src/wasm/signature-map.h" #include "src/wasm/wasm-opcodes.h" namespace v8 { namespace internal { namespace compiler { class CallDescriptor; class WasmCompilationUnit; } namespace wasm { class ErrorThrower; const size_t kMaxModuleSize = 1024 * 1024 * 1024; const size_t kMaxFunctionSize = 128 * 1024; const size_t kMaxStringSize = 256; const uint32_t kWasmMagic = 0x6d736100; const uint32_t kWasmVersion = 0x0d; const uint8_t kWasmFunctionTypeForm = 0x60; const uint8_t kWasmAnyFunctionTypeForm = 0x70; enum WasmSectionCode { kUnknownSectionCode = 0, // code for unknown sections kTypeSectionCode = 1, // Function signature declarations kImportSectionCode = 2, // Import declarations kFunctionSectionCode = 3, // Function declarations kTableSectionCode = 4, // Indirect function table and other tables kMemorySectionCode = 5, // Memory attributes kGlobalSectionCode = 6, // Global declarations kExportSectionCode = 7, // Exports kStartSectionCode = 8, // Start function declaration kElementSectionCode = 9, // Elements section kCodeSectionCode = 10, // Function code kDataSectionCode = 11, // Data segments kNameSectionCode = 12, // Name section (encoded as a string) }; inline bool IsValidSectionCode(uint8_t byte) { return kTypeSectionCode <= byte && byte <= kDataSectionCode; } const char* SectionName(WasmSectionCode code); class WasmDebugInfo; // Constants for fixed-size elements within a module. static const uint32_t kMaxReturnCount = 1; static const uint8_t kResizableMaximumFlag = 1; static const int32_t kInvalidFunctionIndex = -1; enum WasmExternalKind { kExternalFunction = 0, kExternalTable = 1, kExternalMemory = 2, kExternalGlobal = 3 }; // Representation of an initializer expression. struct WasmInitExpr { enum WasmInitKind { kNone, kGlobalIndex, kI32Const, kI64Const, kF32Const, kF64Const } kind; union { int32_t i32_const; int64_t i64_const; float f32_const; double f64_const; uint32_t global_index; } val; WasmInitExpr() : kind(kNone) {} explicit WasmInitExpr(int32_t v) : kind(kI32Const) { val.i32_const = v; } explicit WasmInitExpr(int64_t v) : kind(kI64Const) { val.i64_const = v; } explicit WasmInitExpr(float v) : kind(kF32Const) { val.f32_const = v; } explicit WasmInitExpr(double v) : kind(kF64Const) { val.f64_const = v; } WasmInitExpr(WasmInitKind kind, uint32_t global_index) : kind(kGlobalIndex) { val.global_index = global_index; } }; // Static representation of a WASM function. struct WasmFunction { FunctionSig* sig; // signature of the function. uint32_t func_index; // index into the function table. uint32_t sig_index; // index into the signature table. uint32_t name_offset; // offset in the module bytes of the name, if any. uint32_t name_length; // length in bytes of the name. uint32_t code_start_offset; // offset in the module bytes of code start. uint32_t code_end_offset; // offset in the module bytes of code end. bool imported; bool exported; }; // Static representation of a wasm global variable. struct WasmGlobal { LocalType type; // type of the global. bool mutability; // {true} if mutable. WasmInitExpr init; // the initialization expression of the global. uint32_t offset; // offset into global memory. bool imported; // true if imported. bool exported; // true if exported. }; // Static representation of a wasm data segment. struct WasmDataSegment { WasmInitExpr dest_addr; // destination memory address of the data. uint32_t source_offset; // start offset in the module bytes. uint32_t source_size; // end offset in the module bytes. }; // Static representation of a wasm indirect call table. struct WasmIndirectFunctionTable { uint32_t min_size; // minimum table size. uint32_t max_size; // maximum table size. bool has_max; // true if there is a maximum size. // TODO(titzer): Move this to WasmInstance. Needed by interpreter only. std::vector<int32_t> values; // function table, -1 indicating invalid. bool imported; // true if imported. bool exported; // true if exported. SignatureMap map; // canonicalizing map for sig indexes. }; // Static representation of how to initialize a table. struct WasmTableInit { uint32_t table_index; WasmInitExpr offset; std::vector<uint32_t> entries; }; // Static representation of a WASM import. struct WasmImport { uint32_t module_name_length; // length in bytes of the module name. uint32_t module_name_offset; // offset in module bytes of the module name. uint32_t field_name_length; // length in bytes of the import name. uint32_t field_name_offset; // offset in module bytes of the import name. WasmExternalKind kind; // kind of the import. uint32_t index; // index into the respective space. }; // Static representation of a WASM export. struct WasmExport { uint32_t name_length; // length in bytes of the exported name. uint32_t name_offset; // offset in module bytes of the name to export. WasmExternalKind kind; // kind of the export. uint32_t index; // index into the respective space. }; enum ModuleOrigin { kWasmOrigin, kAsmJsOrigin }; class WasmCompiledModule; // Static representation of a module. struct V8_EXPORT_PRIVATE WasmModule { static const uint32_t kPageSize = 0x10000; // Page size, 64kb. static const uint32_t kMinMemPages = 1; // Minimum memory size = 64kb static const size_t kV8MaxPages = 16384; // Maximum memory size = 1gb static const size_t kV8MaxTableSize = 16 * 1024 * 1024; Zone* owned_zone; const byte* module_start = nullptr; // starting address for the module bytes const byte* module_end = nullptr; // end address for the module bytes uint32_t min_mem_pages = 0; // minimum size of the memory in 64k pages uint32_t max_mem_pages = 0; // maximum size of the memory in 64k pages bool mem_export = false; // true if the memory is exported // TODO(wasm): reconcile start function index being an int with // the fact that we index on uint32_t, so we may technically not be // able to represent some start_function_index -es. int start_function_index = -1; // start function, if any ModuleOrigin origin = kWasmOrigin; // origin of the module std::vector<WasmGlobal> globals; // globals in this module. uint32_t globals_size = 0; // size of globals table. uint32_t num_imported_functions = 0; // number of imported functions. uint32_t num_declared_functions = 0; // number of declared functions. uint32_t num_exported_functions = 0; // number of exported functions. std::vector<FunctionSig*> signatures; // signatures in this module. std::vector<WasmFunction> functions; // functions in this module. std::vector<WasmDataSegment> data_segments; // data segments in this module. std::vector<WasmIndirectFunctionTable> function_tables; // function tables. std::vector<WasmImport> import_table; // import table. std::vector<WasmExport> export_table; // export table. std::vector<WasmTableInit> table_inits; // initializations of tables // We store the semaphore here to extend its lifetime. In <libc-2.21, which we // use on the try bots, semaphore::Wait() can return while some compilation // tasks are still executing semaphore::Signal(). If the semaphore is cleaned // up right after semaphore::Wait() returns, then this can cause an // invalid-semaphore error in the compilation tasks. // TODO(wasm): Move this semaphore back to CompileInParallel when the try bots // switch to libc-2.21 or higher. std::unique_ptr<base::Semaphore> pending_tasks; WasmModule() : WasmModule(nullptr, nullptr) {} WasmModule(Zone* owned_zone, const byte* module_start); ~WasmModule() { if (owned_zone) delete owned_zone; } // Get a string stored in the module bytes representing a name. WasmName GetName(uint32_t offset, uint32_t length) const { if (length == 0) return {"<?>", 3}; // no name. CHECK(BoundsCheck(offset, offset + length)); DCHECK_GE(static_cast<int>(length), 0); return {reinterpret_cast<const char*>(module_start + offset), static_cast<int>(length)}; } // Get a string stored in the module bytes representing a function name. WasmName GetName(WasmFunction* function) const { return GetName(function->name_offset, function->name_length); } // Get a string stored in the module bytes representing a name. WasmName GetNameOrNull(uint32_t offset, uint32_t length) const { if (offset == 0 && length == 0) return {NULL, 0}; // no name. CHECK(BoundsCheck(offset, offset + length)); DCHECK_GE(static_cast<int>(length), 0); return {reinterpret_cast<const char*>(module_start + offset), static_cast<int>(length)}; } // Get a string stored in the module bytes representing a function name. WasmName GetNameOrNull(const WasmFunction* function) const { return GetNameOrNull(function->name_offset, function->name_length); } // Checks the given offset range is contained within the module bytes. bool BoundsCheck(uint32_t start, uint32_t end) const { size_t size = module_end - module_start; return start <= size && end <= size; } // Creates a new instantiation of the module in the given isolate. static MaybeHandle<JSObject> Instantiate(Isolate* isolate, ErrorThrower* thrower, Handle<JSObject> wasm_module, Handle<JSReceiver> ffi, Handle<JSArrayBuffer> memory); MaybeHandle<WasmCompiledModule> CompileFunctions( Isolate* isolate, Handle<Managed<WasmModule>> module_wrapper, ErrorThrower* thrower) const; }; typedef Managed<WasmModule> WasmModuleWrapper; // An instantiated WASM module, including memory, function table, etc. struct WasmInstance { const WasmModule* module; // static representation of the module. // -- Heap allocated -------------------------------------------------------- Handle<JSObject> js_object; // JavaScript module object. Handle<Context> context; // JavaScript native context. Handle<JSArrayBuffer> mem_buffer; // Handle to array buffer of memory. Handle<JSArrayBuffer> globals_buffer; // Handle to array buffer of globals. std::vector<Handle<FixedArray>> function_tables; // indirect function tables. std::vector<Handle<Code>> function_code; // code objects for each function. // -- raw memory ------------------------------------------------------------ byte* mem_start = nullptr; // start of linear memory. uint32_t mem_size = 0; // size of the linear memory. // -- raw globals ----------------------------------------------------------- byte* globals_start = nullptr; // start of the globals area. explicit WasmInstance(const WasmModule* m) : module(m), function_tables(m->function_tables.size()), function_code(m->functions.size()) {} }; // Interface provided to the decoder/graph builder which contains only // minimal information about the globals, functions, and function tables. struct V8_EXPORT_PRIVATE ModuleEnv { const WasmModule* module; WasmInstance* instance; ModuleOrigin origin; bool IsValidGlobal(uint32_t index) const { return module && index < module->globals.size(); } bool IsValidFunction(uint32_t index) const { return module && index < module->functions.size(); } bool IsValidSignature(uint32_t index) const { return module && index < module->signatures.size(); } bool IsValidTable(uint32_t index) const { return module && index < module->function_tables.size(); } LocalType GetGlobalType(uint32_t index) { DCHECK(IsValidGlobal(index)); return module->globals[index].type; } FunctionSig* GetFunctionSignature(uint32_t index) { DCHECK(IsValidFunction(index)); return module->functions[index].sig; } FunctionSig* GetSignature(uint32_t index) { DCHECK(IsValidSignature(index)); return module->signatures[index]; } const WasmIndirectFunctionTable* GetTable(uint32_t index) const { DCHECK(IsValidTable(index)); return &module->function_tables[index]; } bool asm_js() { return origin == kAsmJsOrigin; } Handle<Code> GetFunctionCode(uint32_t index) { DCHECK_NOT_NULL(instance); return instance->function_code[index]; } static compiler::CallDescriptor* GetWasmCallDescriptor(Zone* zone, FunctionSig* sig); static compiler::CallDescriptor* GetI32WasmCallDescriptor( Zone* zone, compiler::CallDescriptor* descriptor); static compiler::CallDescriptor* GetI32WasmCallDescriptorForSimd( Zone* zone, compiler::CallDescriptor* descriptor); }; // A helper for printing out the names of functions. struct WasmFunctionName { const WasmFunction* function_; const WasmModule* module_; WasmFunctionName(const WasmFunction* function, const ModuleEnv* menv) : function_(function), module_(menv ? menv->module : nullptr) {} }; std::ostream& operator<<(std::ostream& os, const WasmModule& module); std::ostream& operator<<(std::ostream& os, const WasmFunction& function); std::ostream& operator<<(std::ostream& os, const WasmFunctionName& name); class WasmCompiledModule : public FixedArray { public: static WasmCompiledModule* cast(Object* fixed_array) { SLOW_DCHECK(IsWasmCompiledModule(fixed_array)); return reinterpret_cast<WasmCompiledModule*>(fixed_array); } #define WCM_OBJECT_OR_WEAK(TYPE, NAME, ID) \ Handle<TYPE> NAME() const { return handle(ptr_to_##NAME()); } \ \ MaybeHandle<TYPE> maybe_##NAME() const { \ if (has_##NAME()) return NAME(); \ return MaybeHandle<TYPE>(); \ } \ \ TYPE* ptr_to_##NAME() const { \ Object* obj = get(ID); \ if (!obj->Is##TYPE()) return nullptr; \ return TYPE::cast(obj); \ } \ \ void set_##NAME(Handle<TYPE> value) { set_ptr_to_##NAME(*value); } \ \ void set_ptr_to_##NAME(TYPE* value) { set(ID, value); } \ \ bool has_##NAME() const { return get(ID)->Is##TYPE(); } \ \ void reset_##NAME() { set_undefined(ID); } #define WCM_OBJECT(TYPE, NAME) WCM_OBJECT_OR_WEAK(TYPE, NAME, kID_##NAME) #define WCM_SMALL_NUMBER(TYPE, NAME) \ TYPE NAME() const { \ return static_cast<TYPE>(Smi::cast(get(kID_##NAME))->value()); \ } \ void set_##NAME(TYPE value) { set(kID_##NAME, Smi::FromInt(value)); } #define WCM_WEAK_LINK(TYPE, NAME) \ WCM_OBJECT_OR_WEAK(WeakCell, weak_##NAME, kID_##NAME); \ \ Handle<TYPE> NAME() const { \ return handle(TYPE::cast(weak_##NAME()->value())); \ } #define CORE_WCM_PROPERTY_TABLE(MACRO) \ MACRO(OBJECT, FixedArray, code_table) \ MACRO(OBJECT, Foreign, module_wrapper) \ MACRO(OBJECT, SeqOneByteString, module_bytes) \ MACRO(OBJECT, Script, asm_js_script) \ MACRO(OBJECT, FixedArray, function_tables) \ MACRO(OBJECT, FixedArray, empty_function_tables) \ MACRO(OBJECT, ByteArray, asm_js_offset_tables) \ MACRO(OBJECT, JSArrayBuffer, memory) \ MACRO(SMALL_NUMBER, uint32_t, min_mem_pages) \ MACRO(WEAK_LINK, WasmCompiledModule, next_instance) \ MACRO(WEAK_LINK, WasmCompiledModule, prev_instance) \ MACRO(WEAK_LINK, JSObject, owning_instance) \ MACRO(WEAK_LINK, JSObject, wasm_module) #if DEBUG #define DEBUG_ONLY_TABLE(MACRO) MACRO(SMALL_NUMBER, uint32_t, instance_id) #else #define DEBUG_ONLY_TABLE(IGNORE) uint32_t instance_id() const { return -1; } #endif #define WCM_PROPERTY_TABLE(MACRO) \ CORE_WCM_PROPERTY_TABLE(MACRO) \ DEBUG_ONLY_TABLE(MACRO) private: enum PropertyIndices { #define INDICES(IGNORE1, IGNORE2, NAME) kID_##NAME, WCM_PROPERTY_TABLE(INDICES) Count #undef INDICES }; public: static Handle<WasmCompiledModule> New( Isolate* isolate, Handle<Managed<WasmModule>> module_wrapper); static Handle<WasmCompiledModule> Clone(Isolate* isolate, Handle<WasmCompiledModule> module) { Handle<WasmCompiledModule> ret = Handle<WasmCompiledModule>::cast( isolate->factory()->CopyFixedArray(module)); ret->InitId(); ret->reset_weak_owning_instance(); ret->reset_weak_next_instance(); ret->reset_weak_prev_instance(); return ret; } uint32_t mem_size() const { return has_memory() ? memory()->byte_length()->Number() : default_mem_size(); } uint32_t default_mem_size() const { return min_mem_pages() * WasmModule::kPageSize; } #define DECLARATION(KIND, TYPE, NAME) WCM_##KIND(TYPE, NAME) WCM_PROPERTY_TABLE(DECLARATION) #undef DECLARATION static bool IsWasmCompiledModule(Object* obj); void PrintInstancesChain(); static void RecreateModuleWrapper(Isolate* isolate, Handle<FixedArray> compiled_module); private: void InitId(); DISALLOW_IMPLICIT_CONSTRUCTORS(WasmCompiledModule); }; // Extract a function name from the given wasm object. // Returns "<WASM UNNAMED>" if the function is unnamed or the name is not a // valid UTF-8 string. Handle<String> GetWasmFunctionName(Isolate* isolate, Handle<Object> wasm, uint32_t func_index); // Extract a function name from the given wasm object. // Returns a null handle if the function is unnamed or the name is not a valid // UTF-8 string. Handle<Object> GetWasmFunctionNameOrNull(Isolate* isolate, Handle<Object> wasm, uint32_t func_index); // Return the binary source bytes of a wasm module. Handle<SeqOneByteString> GetWasmBytes(Handle<JSObject> wasm); // Get the debug info associated with the given wasm object. // If no debug info exists yet, it is created automatically. Handle<WasmDebugInfo> GetDebugInfo(Handle<JSObject> wasm); // Return the number of functions in the given wasm object. int GetNumberOfFunctions(Handle<JSObject> wasm); // Create and export JSFunction Handle<JSFunction> WrapExportCodeAsJSFunction(Isolate* isolate, Handle<Code> export_code, Handle<String> name, FunctionSig* sig, int func_index, Handle<JSObject> instance); // Check whether the given object represents a WebAssembly.Instance instance. // This checks the number and type of internal fields, so it's not 100 percent // secure. If it turns out that we need more complete checks, we could add a // special marker as internal field, which will definitely never occur anywhere // else. bool IsWasmInstance(Object* instance); // Return the compiled module object for this WASM instance. WasmCompiledModule* GetCompiledModule(Object* wasm_instance); // Check whether the wasm module was generated from asm.js code. bool WasmIsAsmJs(Object* instance, Isolate* isolate); // Get the script for the asm.js origin of the wasm module. Handle<Script> GetAsmWasmScript(Handle<JSObject> instance); // Get the asm.js source position for the given byte offset in the given // function. int GetAsmWasmSourcePosition(Handle<JSObject> instance, int func_index, int byte_offset); // Constructs a single function table as a FixedArray of double size, // populating it with function signature indices and function indices. Handle<FixedArray> BuildFunctionTable(Isolate* isolate, uint32_t index, const WasmModule* module); // Populates a function table by replacing function indices with handles to // the compiled code. void PopulateFunctionTable(Handle<FixedArray> table, uint32_t table_size, const std::vector<Handle<Code>>* code_table); Handle<JSObject> CreateWasmModuleObject( Isolate* isolate, Handle<WasmCompiledModule> compiled_module, ModuleOrigin origin); V8_EXPORT_PRIVATE MaybeHandle<JSObject> CreateModuleObjectFromBytes( Isolate* isolate, const byte* start, const byte* end, ErrorThrower* thrower, ModuleOrigin origin, Handle<Script> asm_js_script, const byte* asm_offset_tables_start, const byte* asm_offset_tables_end); V8_EXPORT_PRIVATE bool ValidateModuleBytes(Isolate* isolate, const byte* start, const byte* end, ErrorThrower* thrower, ModuleOrigin origin); // Get the number of imported functions for a WASM instance. int GetNumImportedFunctions(Handle<JSObject> instance); // Assumed to be called with a code object associated to a wasm module instance. // Intended to be called from runtime functions. // Returns nullptr on failing to get owning instance. Object* GetOwningWasmInstance(Code* code); MaybeHandle<JSArrayBuffer> GetInstanceMemory(Isolate* isolate, Handle<JSObject> instance); int32_t GetInstanceMemorySize(Isolate* isolate, Handle<JSObject> instance); int32_t GrowInstanceMemory(Isolate* isolate, Handle<JSObject> instance, uint32_t pages); void UpdateDispatchTables(Isolate* isolate, Handle<FixedArray> dispatch_tables, int index, Handle<JSFunction> js_function); namespace testing { void ValidateInstancesChain(Isolate* isolate, Handle<JSObject> wasm_module, int instance_count); void ValidateModuleState(Isolate* isolate, Handle<JSObject> wasm_module); void ValidateOrphanedInstance(Isolate* isolate, Handle<JSObject> instance); } // namespace testing } // namespace wasm } // namespace internal } // namespace v8 #endif // V8_WASM_MODULE_H_