summary | refs | log | tree | commit | diff
path: root/deps/v8/src/wasm/module-decoder.cc
diff options
context:
space:
mode:
Diffstat (limited to 'deps/v8/src/wasm/module-decoder.cc')
-rw-r--r-- deps/v8/src/wasm/module-decoder.cc 1079
1 files changed, 688 insertions, 391 deletions
diff --git a/deps/v8/src/wasm/module-decoder.cc b/deps/v8/src/wasm/module-decoder.cc
index 542c47ca15..90065616d9 100644
--- a/deps/v8/src/wasm/module-decoder.cc
+++ b/deps/v8/src/wasm/module-decoder.cc
@@ -27,6 +27,141 @@ namespace wasm {
namespace {
+// Name that identifies the "names" section among unknown-code sections.
+// Declared as a const array (rather than a mutable pointer) so the length
+// below is derived from the literal and the two cannot drift apart.
+const char kNameString[] = "name";
+// Length of {kNameString} in bytes, excluding the terminating NUL.
+const size_t kNameStringLength = sizeof(kNameString) - 1;
+
+// Returns the value type produced by the initializer expression {expr}.
+// An absent initializer, or a global index that is out of range for
+// {module->globals}, yields kAstStmt.
+LocalType TypeOf(const WasmModule* module, const WasmInitExpr& expr) {
+  LocalType type = kAstStmt;
+  switch (expr.kind) {
+    case WasmInitExpr::kNone:
+      break;
+    case WasmInitExpr::kGlobalIndex: {
+      const auto global_index = expr.val.global_index;
+      if (global_index < module->globals.size()) {
+        type = module->globals[global_index].type;
+      }
+      break;
+    }
+    case WasmInitExpr::kI32Const:
+      type = kAstI32;
+      break;
+    case WasmInitExpr::kI64Const:
+      type = kAstI64;
+      break;
+    case WasmInitExpr::kF32Const:
+      type = kAstF32;
+      break;
+    case WasmInitExpr::kF64Const:
+      type = kAstF64;
+      break;
+    default:
+      UNREACHABLE();
+  }
+  return type;
+}
+
+// An iterator over the sections in a WASM binary module.
+// Automatically skips all unknown sections.
+//
+// The iterator shares {decoder} with its user: it reads each section header
+// through the decoder, the user then decodes the payload of the section
+// reported by {section_code()} with the same decoder, and finally calls
+// {advance()} to verify the payload size and move to the next section.
+class WasmSectionIterator {
+ public:
+  // Starts iterating at {decoder}'s current position and immediately reads
+  // the first section header.
+  explicit WasmSectionIterator(Decoder& decoder)
+      : decoder_(decoder),
+        section_code_(kUnknownSectionCode),
+        section_start_(decoder.pc()),
+        section_end_(decoder.pc()) {
+    next();
+  }
+
+  // True while a known section is current and the decoder has bytes left.
+  inline bool more() const {
+    return section_code_ != kUnknownSectionCode && decoder_.more();
+  }
+
+  // Code of the current section; kUnknownSectionCode once iteration stopped.
+  inline WasmSectionCode section_code() const { return section_code_; }
+
+  // First byte after the current section's length field.
+  inline const byte* section_start() const { return section_start_; }
+
+  // Number of bytes between {section_start()} and {section_end()}.
+  inline uint32_t section_length() const {
+    return static_cast<uint32_t>(section_end_ - section_start_);
+  }
+
+  // One past the last byte of the current section. Equal to
+  // {section_start()} when the declared length did not fit in the module.
+  inline const byte* section_end() const { return section_end_; }
+
+  // Advances to the next section, checking that decoding the current section
+  // stopped at {section_end_}.
+  void advance() {
+    if (decoder_.pc() != section_end_) {
+      const char* msg = decoder_.pc() < section_end_ ? "shorter" : "longer";
+      decoder_.error(decoder_.pc(), decoder_.pc(),
+                     "section was %s than expected size "
+                     "(%u bytes expected, %zu decoded)",
+                     msg, section_length(),
+                     static_cast<size_t>(decoder_.pc() - section_start_));
+    }
+    next();
+  }
+
+ private:
+  Decoder& decoder_;
+  WasmSectionCode section_code_;
+  const byte* section_start_;
+  const byte* section_end_;
+
+  // Reads the section code/name at the current position and sets up
+  // the internal fields. Loops past unknown sections so that, on return,
+  // either a known section is current or {section_code_} is
+  // kUnknownSectionCode (end of input or a malformed header).
+  void next() {
+    while (true) {
+      if (!decoder_.more()) {
+        section_code_ = kUnknownSectionCode;
+        return;
+      }
+      uint8_t section_code = decoder_.consume_u8("section code");
+      // Read and check the section size.
+      uint32_t section_length = decoder_.consume_u32v("section length");
+      section_start_ = decoder_.pc();
+      if (decoder_.checkAvailable(section_length)) {
+        // Get the limit of the section within the module.
+        section_end_ = section_start_ + section_length;
+      } else {
+        // The section would extend beyond the end of the module.
+        section_end_ = section_start_;
+      }
+
+      if (section_code == kUnknownSectionCode) {
+        // Check for the known "names" section.
+        uint32_t string_length = decoder_.consume_u32v("section name length");
+        const byte* section_name_start = decoder_.pc();
+        decoder_.consume_bytes(string_length, "section name");
+        if (decoder_.failed() || decoder_.pc() > section_end_) {
+          TRACE("Section name of length %u couldn't be read\n", string_length);
+          // A name that runs past its own section but still fits in the
+          // module leaves the decoder in a non-failed state. Report it, so
+          // that stopping here is not mistaken for a clean end of module.
+          if (!decoder_.failed()) {
+            decoder_.error(section_name_start, section_name_start,
+                           "section name of length %u extends past the end "
+                           "of its section",
+                           string_length);
+          }
+          section_code_ = kUnknownSectionCode;
+          return;
+        }
+
+        // The precision argument of "%.*s" must be an int.
+        TRACE("  +%d  section name        : \"%.*s\"\n",
+              static_cast<int>(section_name_start - decoder_.start()),
+              static_cast<int>(string_length < 20 ? string_length : 20),
+              section_name_start);
+
+        if (string_length == kNameStringLength &&
+            strncmp(reinterpret_cast<const char*>(section_name_start),
+                    kNameString, kNameStringLength) == 0) {
+          section_code = kNameSectionCode;
+        } else {
+          section_code = kUnknownSectionCode;
+        }
+      } else if (!IsValidSectionCode(section_code)) {
+        decoder_.error(decoder_.pc(), decoder_.pc(),
+                       "unknown section code #0x%02x", section_code);
+        section_code = kUnknownSectionCode;
+      }
+      section_code_ = static_cast<WasmSectionCode>(section_code);
+
+      TRACE("Section: %s\n", SectionName(section_code_));
+      if (section_code_ == kUnknownSectionCode &&
+          section_end_ > decoder_.pc()) {
+        // skip to the end of the unknown section.
+        uint32_t remaining =
+            static_cast<uint32_t>(section_end_ - decoder_.pc());
+        decoder_.consume_bytes(remaining, "section payload");
+        // fall through and continue to the next section.
+      } else {
+        return;
+      }
+    }
+  }
+};
+
// The main logic for decoding the bytes of a module.
class ModuleDecoder : public Decoder {
public:
@@ -77,11 +212,9 @@ class ModuleDecoder : public Decoder {
module->min_mem_pages = 0;
module->max_mem_pages = 0;
module->mem_export = false;
- module->mem_external = false;
module->origin = origin_;
const byte* pos = pc_;
- int current_order = 0;
uint32_t magic_word = consume_u32("wasm magic");
#define BYTES(x) (x & 0xff), (x >> 8) & 0xff, (x >> 16) & 0xff, (x >> 24) & 0xff
if (magic_word != kWasmMagic) {
@@ -89,7 +222,6 @@ class ModuleDecoder : public Decoder {
"expected magic word %02x %02x %02x %02x, "
"found %02x %02x %02x %02x",
BYTES(kWasmMagic), BYTES(magic_word));
- goto done;
}
pos = pc_;
@@ -100,302 +232,367 @@ class ModuleDecoder : public Decoder {
"expected version %02x %02x %02x %02x, "
"found %02x %02x %02x %02x",
BYTES(kWasmVersion), BYTES(magic_version));
- goto done;
}
}
- // Decode the module sections.
- while (pc_ < limit_) {
- TRACE("DecodeSection\n");
- pos = pc_;
-
- // Read the section name.
- uint32_t string_length = consume_u32v("section name length");
- const byte* section_name_start = pc_;
- consume_bytes(string_length);
- if (failed()) {
- TRACE("Section name of length %u couldn't be read\n", string_length);
- break;
+ WasmSectionIterator section_iter(*this);
+
+ // ===== Type section ====================================================
+ if (section_iter.section_code() == kTypeSectionCode) {
+ uint32_t signatures_count = consume_u32v("signatures count");
+ module->signatures.reserve(SafeReserve(signatures_count));
+ for (uint32_t i = 0; ok() && i < signatures_count; ++i) {
+ TRACE("DecodeSignature[%d] module+%d\n", i,
+ static_cast<int>(pc_ - start_));
+ FunctionSig* s = consume_sig();
+ module->signatures.push_back(s);
}
+ section_iter.advance();
+ }
- TRACE(" +%d section name : \"%.*s\"\n",
- static_cast<int>(section_name_start - start_),
- string_length < 20 ? string_length : 20, section_name_start);
-
- WasmSection::Code section =
- WasmSection::lookup(section_name_start, string_length);
-
- // Read and check the section size.
- uint32_t section_length = consume_u32v("section length");
- if (!checkAvailable(section_length)) {
- // The section would extend beyond the end of the module.
- break;
- }
- const byte* section_start = pc_;
- const byte* expected_section_end = pc_ + section_length;
-
- current_order = CheckSectionOrder(current_order, section);
-
- switch (section) {
- case WasmSection::Code::End:
- // Terminate section decoding.
- limit_ = pc_;
- break;
- case WasmSection::Code::Memory: {
- module->min_mem_pages = consume_u32v("min memory");
- module->max_mem_pages = consume_u32v("max memory");
- module->mem_export = consume_u8("export memory") != 0;
- break;
- }
- case WasmSection::Code::Signatures: {
- uint32_t signatures_count = consume_u32v("signatures count");
- module->signatures.reserve(SafeReserve(signatures_count));
- // Decode signatures.
- for (uint32_t i = 0; i < signatures_count; ++i) {
- if (failed()) break;
- TRACE("DecodeSignature[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
- FunctionSig* s = consume_sig();
- module->signatures.push_back(s);
- }
- break;
+ // ===== Import section ==================================================
+ if (section_iter.section_code() == kImportSectionCode) {
+ uint32_t import_table_count = consume_u32v("import table count");
+ module->import_table.reserve(SafeReserve(import_table_count));
+ for (uint32_t i = 0; ok() && i < import_table_count; ++i) {
+ TRACE("DecodeImportTable[%d] module+%d\n", i,
+ static_cast<int>(pc_ - start_));
+
+ module->import_table.push_back({
+ 0, // module_name_length
+ 0, // module_name_offset
+ 0, // field_name_offset
+ 0, // field_name_length
+ kExternalFunction, // kind
+ 0 // index
+ });
+ WasmImport* import = &module->import_table.back();
+ const byte* pos = pc_;
+ import->module_name_offset =
+ consume_string(&import->module_name_length, true);
+ if (import->module_name_length == 0) {
+ error(pos, "import module name cannot be NULL");
}
- case WasmSection::Code::FunctionSignatures: {
- uint32_t functions_count = consume_u32v("functions count");
- module->functions.reserve(SafeReserve(functions_count));
- for (uint32_t i = 0; i < functions_count; ++i) {
- module->functions.push_back({nullptr, // sig
- i, // func_index
- 0, // sig_index
- 0, // name_offset
- 0, // name_length
- 0, // code_start_offset
- 0}); // code_end_offset
+ import->field_name_offset =
+ consume_string(&import->field_name_length, true);
+
+ import->kind = static_cast<WasmExternalKind>(consume_u8("import kind"));
+ switch (import->kind) {
+ case kExternalFunction: {
+ // ===== Imported function =======================================
+ import->index = static_cast<uint32_t>(module->functions.size());
+ module->num_imported_functions++;
+ module->functions.push_back({nullptr, // sig
+ import->index, // func_index
+ 0, // sig_index
+ 0, // name_offset
+ 0, // name_length
+ 0, // code_start_offset
+ 0, // code_end_offset
+ true, // imported
+ false}); // exported
WasmFunction* function = &module->functions.back();
function->sig_index = consume_sig_index(module, &function->sig);
- }
- break;
- }
- case WasmSection::Code::FunctionBodies: {
- const byte* pos = pc_;
- uint32_t functions_count = consume_u32v("functions count");
- if (functions_count != module->functions.size()) {
- error(pos, pos, "function body count %u mismatch (%u expected)",
- functions_count,
- static_cast<uint32_t>(module->functions.size()));
break;
}
- for (uint32_t i = 0; i < functions_count; ++i) {
- WasmFunction* function = &module->functions[i];
- uint32_t size = consume_u32v("body size");
- function->code_start_offset = pc_offset();
- function->code_end_offset = pc_offset() + size;
-
- TRACE(" +%d %-20s: (%d bytes)\n", pc_offset(), "function body",
- size);
- pc_ += size;
- if (pc_ > limit_) {
- error(pc_, "function body extends beyond end of file");
- }
- }
- break;
- }
- case WasmSection::Code::Names: {
- const byte* pos = pc_;
- uint32_t functions_count = consume_u32v("functions count");
- if (functions_count != module->functions.size()) {
- error(pos, pos, "function name count %u mismatch (%u expected)",
- functions_count,
- static_cast<uint32_t>(module->functions.size()));
+ case kExternalTable: {
+ // ===== Imported table ==========================================
+ import->index =
+ static_cast<uint32_t>(module->function_tables.size());
+ module->function_tables.push_back(
+ {0, 0, std::vector<int32_t>(), true, false});
+ expect_u8("element type", 0x20);
+ WasmIndirectFunctionTable* table = &module->function_tables.back();
+ consume_resizable_limits("element count", "elements", kMaxUInt32,
+ &table->size, &table->max_size);
break;
}
-
- for (uint32_t i = 0; i < functions_count; ++i) {
- WasmFunction* function = &module->functions[i];
- function->name_offset =
- consume_string(&function->name_length, false);
-
- uint32_t local_names_count = consume_u32v("local names count");
- for (uint32_t j = 0; j < local_names_count; j++) {
- uint32_t unused = 0;
- uint32_t offset = consume_string(&unused, false);
- USE(unused);
- USE(offset);
- }
+ case kExternalMemory: {
+ // ===== Imported memory =========================================
+ // import->index =
+ // static_cast<uint32_t>(module->memories.size());
+ // TODO(titzer): imported memories
+ break;
}
- break;
- }
- case WasmSection::Code::Globals: {
- uint32_t globals_count = consume_u32v("globals count");
- module->globals.reserve(SafeReserve(globals_count));
- // Decode globals.
- for (uint32_t i = 0; i < globals_count; ++i) {
- if (failed()) break;
- TRACE("DecodeGlobal[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
- // Add an uninitialized global and pass a pointer to it.
- module->globals.push_back({0, 0, kAstStmt, 0, false});
+ case kExternalGlobal: {
+ // ===== Imported global =========================================
+ import->index = static_cast<uint32_t>(module->globals.size());
+ module->globals.push_back(
+ {kAstStmt, false, NO_INIT, 0, true, false});
WasmGlobal* global = &module->globals.back();
- DecodeGlobalInModule(global);
- }
- break;
- }
- case WasmSection::Code::DataSegments: {
- uint32_t data_segments_count = consume_u32v("data segments count");
- module->data_segments.reserve(SafeReserve(data_segments_count));
- // Decode data segments.
- for (uint32_t i = 0; i < data_segments_count; ++i) {
- if (failed()) break;
- TRACE("DecodeDataSegment[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
- module->data_segments.push_back({0, // dest_addr
- 0, // source_offset
- 0, // source_size
- false}); // init
- WasmDataSegment* segment = &module->data_segments.back();
- DecodeDataSegmentInModule(module, segment);
+ global->type = consume_value_type();
+ global->mutability = consume_u8("mutability") != 0;
+ break;
}
- break;
+ default:
+ error(pos, pos, "unknown import kind 0x%02x", import->kind);
+ break;
}
- case WasmSection::Code::FunctionTable: {
- // An indirect function table requires functions first.
- CheckForFunctions(module, section);
- // Assume only one table for now.
- static const uint32_t kSupportedTableCount = 1;
- module->function_tables.reserve(SafeReserve(kSupportedTableCount));
- // Decode function table.
- for (uint32_t i = 0; i < kSupportedTableCount; ++i) {
- if (failed()) break;
- TRACE("DecodeFunctionTable[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
- module->function_tables.push_back({0, 0, std::vector<uint16_t>()});
- DecodeFunctionTableInModule(module, &module->function_tables[i]);
+ }
+ section_iter.advance();
+ }
+
+ // ===== Function section ================================================
+ if (section_iter.section_code() == kFunctionSectionCode) {
+ uint32_t functions_count = consume_u32v("functions count");
+ module->functions.reserve(SafeReserve(functions_count));
+ module->num_declared_functions = functions_count;
+ for (uint32_t i = 0; ok() && i < functions_count; ++i) {
+ uint32_t func_index = static_cast<uint32_t>(module->functions.size());
+ module->functions.push_back({nullptr, // sig
+ func_index, // func_index
+ 0, // sig_index
+ 0, // name_offset
+ 0, // name_length
+ 0, // code_start_offset
+ 0, // code_end_offset
+ false, // imported
+ false}); // exported
+ WasmFunction* function = &module->functions.back();
+ function->sig_index = consume_sig_index(module, &function->sig);
+ }
+ section_iter.advance();
+ }
+
+ // ===== Table section ===================================================
+ if (section_iter.section_code() == kTableSectionCode) {
+ const byte* pos = pc_;
+ uint32_t table_count = consume_u32v("table count");
+ // Require at most one table for now.
+ if (table_count > 1) {
+ error(pos, pos, "invalid table count %d, maximum 1", table_count);
+ }
+
+ for (uint32_t i = 0; ok() && i < table_count; i++) {
+ module->function_tables.push_back(
+ {0, 0, std::vector<int32_t>(), false, false});
+ WasmIndirectFunctionTable* table = &module->function_tables.back();
+ expect_u8("table type", kWasmAnyFunctionTypeForm);
+ consume_resizable_limits("table elements", "elements", kMaxUInt32,
+ &table->size, &table->max_size);
+ }
+ section_iter.advance();
+ }
+
+ // ===== Memory section ==================================================
+ if (section_iter.section_code() == kMemorySectionCode) {
+ const byte* pos = pc_;
+ uint32_t memory_count = consume_u32v("memory count");
+ // Require at most one memory for now.
+ if (memory_count > 1) {
+ error(pos, pos, "invalid memory count %d, maximum 1", memory_count);
+ }
+
+ for (uint32_t i = 0; ok() && i < memory_count; i++) {
+ consume_resizable_limits("memory", "pages", WasmModule::kMaxLegalPages,
+ &module->min_mem_pages,
+ &module->max_mem_pages);
+ }
+ section_iter.advance();
+ }
+
+ // ===== Global section ==================================================
+ if (section_iter.section_code() == kGlobalSectionCode) {
+ uint32_t globals_count = consume_u32v("globals count");
+ module->globals.reserve(SafeReserve(globals_count));
+ for (uint32_t i = 0; ok() && i < globals_count; ++i) {
+ TRACE("DecodeGlobal[%d] module+%d\n", i,
+ static_cast<int>(pc_ - start_));
+ // Add an uninitialized global and pass a pointer to it.
+ module->globals.push_back({kAstStmt, false, NO_INIT, 0, false, false});
+ WasmGlobal* global = &module->globals.back();
+ DecodeGlobalInModule(module, i, global);
+ }
+ section_iter.advance();
+ }
+
+ // ===== Export section ==================================================
+ if (section_iter.section_code() == kExportSectionCode) {
+ uint32_t export_table_count = consume_u32v("export table count");
+ module->export_table.reserve(SafeReserve(export_table_count));
+ for (uint32_t i = 0; ok() && i < export_table_count; ++i) {
+ TRACE("DecodeExportTable[%d] module+%d\n", i,
+ static_cast<int>(pc_ - start_));
+
+ module->export_table.push_back({
+ 0, // name_length
+ 0, // name_offset
+ kExternalFunction, // kind
+ 0 // index
+ });
+ WasmExport* exp = &module->export_table.back();
+
+ exp->name_offset = consume_string(&exp->name_length, true);
+ const byte* pos = pc();
+ exp->kind = static_cast<WasmExternalKind>(consume_u8("export kind"));
+ switch (exp->kind) {
+ case kExternalFunction: {
+ WasmFunction* func = nullptr;
+ exp->index = consume_func_index(module, &func);
+ module->num_exported_functions++;
+ if (func) func->exported = true;
+ break;
}
- break;
- }
- case WasmSection::Code::StartFunction: {
- // Declares a start function for a module.
- CheckForFunctions(module, section);
- if (module->start_function_index >= 0) {
- error("start function already declared");
+ case kExternalTable: {
+ WasmIndirectFunctionTable* table = nullptr;
+ exp->index = consume_table_index(module, &table);
+ if (table) table->exported = true;
break;
}
- WasmFunction* func;
- const byte* pos = pc_;
- module->start_function_index = consume_func_index(module, &func);
- if (func && func->sig->parameter_count() > 0) {
- error(pos, "invalid start function: non-zero parameter count");
+ case kExternalMemory: {
+ uint32_t index = consume_u32v("memory index");
+ if (index != 0) error("invalid memory index != 0");
+ module->mem_export = true;
break;
}
- break;
- }
- case WasmSection::Code::ImportTable: {
- uint32_t import_table_count = consume_u32v("import table count");
- module->import_table.reserve(SafeReserve(import_table_count));
- // Decode import table.
- for (uint32_t i = 0; i < import_table_count; ++i) {
- if (failed()) break;
- TRACE("DecodeImportTable[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
-
- module->import_table.push_back({nullptr, // sig
- 0, // sig_index
- 0, // module_name_offset
- 0, // module_name_length
- 0, // function_name_offset
- 0}); // function_name_length
- WasmImport* import = &module->import_table.back();
-
- import->sig_index = consume_sig_index(module, &import->sig);
- const byte* pos = pc_;
- import->module_name_offset =
- consume_string(&import->module_name_length, true);
- if (import->module_name_length == 0) {
- error(pos, "import module name cannot be NULL");
- }
- import->function_name_offset =
- consume_string(&import->function_name_length, true);
+ case kExternalGlobal: {
+ WasmGlobal* global = nullptr;
+ exp->index = consume_global_index(module, &global);
+ if (global) global->exported = true;
+ break;
}
- break;
+ default:
+ error(pos, pos, "invalid export kind 0x%02x", exp->kind);
+ break;
}
- case WasmSection::Code::ExportTable: {
- // Declares an export table.
- CheckForFunctions(module, section);
- uint32_t export_table_count = consume_u32v("export table count");
- module->export_table.reserve(SafeReserve(export_table_count));
- // Decode export table.
- for (uint32_t i = 0; i < export_table_count; ++i) {
- if (failed()) break;
- TRACE("DecodeExportTable[%d] module+%d\n", i,
- static_cast<int>(pc_ - start_));
-
- module->export_table.push_back({0, // func_index
- 0, // name_offset
- 0}); // name_length
- WasmExport* exp = &module->export_table.back();
-
- WasmFunction* func;
- exp->func_index = consume_func_index(module, &func);
- exp->name_offset = consume_string(&exp->name_length, true);
+ }
+ // Check for duplicate exports.
+ if (ok() && module->export_table.size() > 1) {
+ std::vector<WasmExport> sorted_exports(module->export_table);
+ const byte* base = start_;
+ auto cmp_less = [base](const WasmExport& a, const WasmExport& b) {
+ // Return true if a < b.
+ if (a.name_length != b.name_length) {
+ return a.name_length < b.name_length;
}
- // Check for duplicate exports.
- if (ok() && module->export_table.size() > 1) {
- std::vector<WasmExport> sorted_exports(module->export_table);
- const byte* base = start_;
- auto cmp_less = [base](const WasmExport& a, const WasmExport& b) {
- // Return true if a < b.
- uint32_t len = a.name_length;
- if (len != b.name_length) return len < b.name_length;
- return memcmp(base + a.name_offset, base + b.name_offset, len) <
- 0;
- };
- std::stable_sort(sorted_exports.begin(), sorted_exports.end(),
- cmp_less);
- auto it = sorted_exports.begin();
- WasmExport* last = &*it++;
- for (auto end = sorted_exports.end(); it != end; last = &*it++) {
- DCHECK(!cmp_less(*it, *last)); // Vector must be sorted.
- if (!cmp_less(*last, *it)) {
- const byte* pc = start_ + it->name_offset;
- error(pc, pc,
- "Duplicate export name '%.*s' for functions %d and %d",
- it->name_length, pc, last->func_index, it->func_index);
- break;
- }
- }
+ return memcmp(base + a.name_offset, base + b.name_offset,
+ a.name_length) < 0;
+ };
+ std::stable_sort(sorted_exports.begin(), sorted_exports.end(),
+ cmp_less);
+ auto it = sorted_exports.begin();
+ WasmExport* last = &*it++;
+ for (auto end = sorted_exports.end(); it != end; last = &*it++) {
+ DCHECK(!cmp_less(*it, *last)); // Vector must be sorted.
+ if (!cmp_less(*last, *it)) {
+ const byte* pc = start_ + it->name_offset;
+ error(pc, pc,
+ "Duplicate export name '%.*s' for functions %d and %d",
+ it->name_length, pc, last->index, it->index);
+ break;
}
- break;
}
- case WasmSection::Code::Max:
- // Skip unknown sections.
- TRACE("Unknown section: '");
- for (uint32_t i = 0; i != string_length; ++i) {
- TRACE("%c", *(section_name_start + i));
- }
- TRACE("'\n");
- consume_bytes(section_length);
- break;
- }
-
- if (pc_ != expected_section_end) {
- const char* diff = pc_ < expected_section_end ? "shorter" : "longer";
- size_t expected_length = static_cast<size_t>(section_length);
- size_t actual_length = static_cast<size_t>(pc_ - section_start);
- error(pc_, pc_,
- "section \"%s\" %s (%zu bytes) than specified (%zu bytes)",
- WasmSection::getName(section), diff, actual_length,
- expected_length);
- break;
}
+ section_iter.advance();
+ }
+
+ // ===== Start section ===================================================
+ if (section_iter.section_code() == kStartSectionCode) {
+ WasmFunction* func;
+ const byte* pos = pc_;
+ module->start_function_index = consume_func_index(module, &func);
+ if (func && func->sig->parameter_count() > 0) {
+ error(pos, "invalid start function: non-zero parameter count");
+ }
+ section_iter.advance();
+ }
+
+ // ===== Elements section ================================================
+ if (section_iter.section_code() == kElementSectionCode) {
+ uint32_t element_count = consume_u32v("element count");
+ for (uint32_t i = 0; ok() && i < element_count; ++i) {
+ uint32_t table_index = consume_u32v("table index");
+ if (table_index != 0) error("illegal table index != 0");
+ WasmInitExpr offset = consume_init_expr(module, kAstI32);
+ uint32_t num_elem = consume_u32v("number of elements");
+ std::vector<uint32_t> vector;
+ module->table_inits.push_back({table_index, offset, vector});
+ WasmTableInit* init = &module->table_inits.back();
+ init->entries.reserve(SafeReserve(num_elem));
+ for (uint32_t j = 0; ok() && j < num_elem; j++) {
+ WasmFunction* func = nullptr;
+ init->entries.push_back(consume_func_index(module, &func));
+ }
+ }
+
+ section_iter.advance();
+ }
+
+ // ===== Code section ====================================================
+ if (section_iter.section_code() == kCodeSectionCode) {
+ const byte* pos = pc_;
+ uint32_t functions_count = consume_u32v("functions count");
+ if (functions_count != module->num_declared_functions) {
+ error(pos, pos, "function body count %u mismatch (%u expected)",
+ functions_count, module->num_declared_functions);
+ }
+ for (uint32_t i = 0; ok() && i < functions_count; ++i) {
+ WasmFunction* function =
+ &module->functions[i + module->num_imported_functions];
+ uint32_t size = consume_u32v("body size");
+ function->code_start_offset = pc_offset();
+ function->code_end_offset = pc_offset() + size;
+ consume_bytes(size, "function body");
+ }
+ section_iter.advance();
+ }
+
+ // ===== Data section ====================================================
+ if (section_iter.section_code() == kDataSectionCode) {
+ uint32_t data_segments_count = consume_u32v("data segments count");
+ module->data_segments.reserve(SafeReserve(data_segments_count));
+ for (uint32_t i = 0; ok() && i < data_segments_count; ++i) {
+ TRACE("DecodeDataSegment[%d] module+%d\n", i,
+ static_cast<int>(pc_ - start_));
+ module->data_segments.push_back({
+ NO_INIT, // dest_addr
+ 0, // source_offset
+ 0 // source_size
+ });
+ WasmDataSegment* segment = &module->data_segments.back();
+ DecodeDataSegmentInModule(module, segment);
+ }
+ section_iter.advance();
}
- done:
- if (ok()) CalculateGlobalsOffsets(module);
+ // ===== Name section ====================================================
+ if (section_iter.section_code() == kNameSectionCode) {
+ const byte* pos = pc_;
+ uint32_t functions_count = consume_u32v("functions count");
+ if (functions_count != module->num_declared_functions) {
+ error(pos, pos, "function name count %u mismatch (%u expected)",
+ functions_count, module->num_declared_functions);
+ }
+
+ for (uint32_t i = 0; ok() && i < functions_count; ++i) {
+ WasmFunction* function =
+ &module->functions[i + module->num_imported_functions];
+ function->name_offset = consume_string(&function->name_length, false);
+
+ uint32_t local_names_count = consume_u32v("local names count");
+ for (uint32_t j = 0; ok() && j < local_names_count; j++) {
+ uint32_t unused = 0;
+ uint32_t offset = consume_string(&unused, false);
+ USE(unused);
+ USE(offset);
+ }
+ }
+ section_iter.advance();
+ }
+
+ // ===== Remaining sections ==============================================
+ if (section_iter.more() && ok()) {
+ error(pc(), pc(), "unexpected section: %s",
+ SectionName(section_iter.section_code()));
+ }
+
+ if (ok()) {
+ CalculateGlobalOffsets(module);
+ PreinitializeIndirectFunctionTables(module);
+ }
const WasmModule* finished_module = module;
ModuleResult result = toResult(finished_module);
- if (FLAG_dump_wasm_module) {
- DumpModule(module, result);
- }
+ if (FLAG_dump_wasm_module) DumpModule(module, result);
return result;
}
@@ -405,27 +602,6 @@ class ModuleDecoder : public Decoder {
return count < kMaxReserve ? count : kMaxReserve;
}
- void CheckForFunctions(WasmModule* module, WasmSection::Code section) {
- if (module->functions.size() == 0) {
- error(pc_ - 1, nullptr, "functions must appear before section %s",
- WasmSection::getName(section));
- }
- }
-
- int CheckSectionOrder(int current_order, WasmSection::Code section) {
- int next_order = WasmSection::getOrder(section);
- if (next_order == 0) return current_order;
- if (next_order == current_order) {
- error(pc_, pc_, "section \"%s\" already defined",
- WasmSection::getName(section));
- }
- if (next_order < current_order) {
- error(pc_, pc_, "section \"%s\" out of order",
- WasmSection::getName(section));
- }
- return next_order;
- }
-
// Decodes a single anonymous function starting at {start_}.
FunctionResult DecodeSingleFunction(ModuleEnv* module_env,
WasmFunction* function) {
@@ -451,6 +627,11 @@ class ModuleDecoder : public Decoder {
return ok() ? result : nullptr;
}
+  // Decodes a single initializer expression located at {start}. Repositions
+  // {pc_} to {start} and delegates to consume_init_expr, passing no module
+  // and kAstStmt.
+  WasmInitExpr DecodeInitExpr(const byte* start) {
+    pc_ = start;
+    WasmInitExpr expr = consume_init_expr(nullptr, kAstStmt);
+    return expr;
+  }
+
private:
Zone* module_zone;
ModuleResult result_;
@@ -459,15 +640,28 @@ class ModuleDecoder : public Decoder {
uint32_t off(const byte* ptr) { return static_cast<uint32_t>(ptr - start_); }
// Decodes a single global entry inside a module starting at {pc_}.
- void DecodeGlobalInModule(WasmGlobal* global) {
- global->name_offset = consume_string(&global->name_length, false);
- if (!unibrow::Utf8::Validate(start_ + global->name_offset,
- global->name_length)) {
- error("global name is not valid utf8");
+  // Reads the value type, the mutability flag and the initializer expression
+  // of {global}, then validates the initializer:
+  //  - an initializer that reads another global must name a global with an
+  //    index below {index} whose type equals the declared type;
+  //  - any other initializer must have the declared type.
+  // Problems are reported through error(); nothing is returned.
+  // NOTE(review): the Global section loop passes its section-relative counter
+  // as {index}; confirm whether imported globals, which are also stored in
+  // {module->globals}, should offset it.
+  void DecodeGlobalInModule(WasmModule* module, uint32_t index,
+                            WasmGlobal* global) {
+    global->type = consume_value_type();
+    global->mutability = consume_u8("mutability") != 0;
+    const byte* pos = pc();
+    global->init = consume_init_expr(module, kAstStmt);
+    switch (global->init.kind) {
+      case WasmInitExpr::kGlobalIndex: {
+        // Compare against the *referenced* global. Looking up {index} here
+        // would compare the global being decoded with itself and never
+        // detect a type mismatch.
+        const auto other_index = global->init.val.global_index;
+        if (other_index >= index) {
+          error("invalid global index in init expression");
+        } else if (module->globals[other_index].type != global->type) {
+          error("type mismatch in global initialization");
+        }
+        break;
+      }
+      default:
+        if (global->type != TypeOf(module, global->init)) {
+          error(pos, pos,
+                "type error in global initialization, expected %s, got %s",
+                WasmOpcodes::TypeName(global->type),
+                WasmOpcodes::TypeName(TypeOf(module, global->init)));
+        }
 }
- global->type = consume_local_type();
- global->offset = 0;
- global->exported = consume_u8("exported") != 0;
 }
bool IsWithinLimit(uint32_t limit, uint32_t offset, uint32_t size) {
@@ -479,10 +673,10 @@ class ModuleDecoder : public Decoder {
// Decodes a single data segment entry inside a module starting at {pc_}.
void DecodeDataSegmentInModule(WasmModule* module, WasmDataSegment* segment) {
const byte* start = pc_;
- segment->dest_addr = consume_u32v("destination");
+ expect_u8("linear memory index", 0);
+ segment->dest_addr = consume_init_expr(module, kAstI32);
segment->source_size = consume_u32v("source size");
segment->source_offset = static_cast<uint32_t>(pc_ - start_);
- segment->init = true;
// Validate the data is in the module.
uint32_t module_limit = static_cast<uint32_t>(limit_ - start_);
@@ -491,40 +685,11 @@ class ModuleDecoder : public Decoder {
error(start, "segment out of bounds of module");
}
- // Validate that the segment will fit into the (minimum) memory.
- uint32_t memory_limit =
- WasmModule::kPageSize * (module ? module->min_mem_pages
- : WasmModule::kMaxMemPages);
- if (!IsWithinLimit(memory_limit, segment->dest_addr,
- segment->source_size)) {
- error(start, "segment out of bounds of memory");
- }
-
- consume_bytes(segment->source_size);
- }
-
- // Decodes a single function table inside a module starting at {pc_}.
- void DecodeFunctionTableInModule(WasmModule* module,
- WasmIndirectFunctionTable* table) {
- table->size = consume_u32v("function table entry count");
- table->max_size = table->size;
-
- if (table->max_size != table->size) {
- error("invalid table maximum size");
- }
-
- for (uint32_t i = 0; i < table->size; ++i) {
- uint16_t index = consume_u32v();
- if (index >= module->functions.size()) {
- error(pc_ - sizeof(index), "invalid function index");
- break;
- }
- table->values.push_back(index);
- }
+ consume_bytes(segment->source_size, "segment data");
}
// Calculate individual global offsets and total size of globals table.
- void CalculateGlobalsOffsets(WasmModule* module) {
+ void CalculateGlobalOffsets(WasmModule* module) {
uint32_t offset = 0;
if (module->globals.size() == 0) {
module->globals_size = 0;
@@ -540,6 +705,30 @@ class ModuleDecoder : public Decoder {
module->globals_size = offset;
}
+  // Builds the initial contents of every indirect function table: each table
+  // is sized to {table.size} and filled with kInvalidFunctionIndex, then the
+  // entries of every table initializer with a constant i32 offset are copied
+  // in. Initializers with a non-constant offset or an out-of-range table
+  // index are ignored, as are entries that would land outside the table.
+  // TODO(titzer): this only works without overlapping initializations from
+  // global bases for entries
+  void PreinitializeIndirectFunctionTables(WasmModule* module) {
+    // Start from tables in which every slot is marked invalid.
+    for (WasmIndirectFunctionTable& table : module->function_tables) {
+      table.values.resize(table.size);
+      for (size_t slot = 0; slot < table.size; ++slot) {
+        table.values[slot] = kInvalidFunctionIndex;
+      }
+    }
+    // Apply the initializers whose destination is known at decode time.
+    for (WasmTableInit& init : module->table_inits) {
+      if (init.offset.kind != WasmInitExpr::kI32Const ||
+          init.table_index >= module->function_tables.size()) {
+        continue;
+      }
+      WasmIndirectFunctionTable& target =
+          module->function_tables[init.table_index];
+      const size_t entry_count = init.entries.size();
+      for (size_t i = 0; i < entry_count; ++i) {
+        const size_t slot = i + init.offset.val.i32_const;
+        // Silently drop entries that fall outside the table.
+        if (slot >= target.values.size()) continue;
+        target.values[slot] = init.entries[i];
+      }
+    }
+  }
+
// Verifies the body (code) of a given function.
void VerifyFunctionBody(uint32_t func_num, ModuleEnv* menv,
WasmFunction* function) {
@@ -570,26 +759,18 @@ class ModuleDecoder : public Decoder {
}
}
- // Reads a single 32-bit unsigned integer interpreted as an offset, checking
- // the offset is within bounds and advances.
- uint32_t consume_offset(const char* name = nullptr) {
- uint32_t offset = consume_u32(name ? name : "offset");
- if (offset > static_cast<uint32_t>(limit_ - start_)) {
- error(pc_ - sizeof(uint32_t), "offset out of bounds of module");
- }
- return offset;
- }
-
// Reads a length-prefixed string, checking that it is within bounds. Returns
// the offset of the string, and the length as an out parameter.
uint32_t consume_string(uint32_t* length, bool validate_utf8) {
*length = consume_u32v("string length");
uint32_t offset = pc_offset();
- TRACE(" +%u %-20s: (%u bytes)\n", offset, "string", *length);
- if (validate_utf8 && !unibrow::Utf8::Validate(pc_, *length)) {
- error(pc_, "no valid UTF-8 string");
+ const byte* string_start = pc_;
+ // Consume bytes before validation to guarantee that the string is not oob.
+ consume_bytes(*length, "string");
+ if (ok() && validate_utf8 &&
+ !unibrow::Utf8::Validate(string_start, *length)) {
+ error(string_start, "no valid UTF-8 string");
}
- consume_bytes(*length);
return offset;
}
@@ -607,25 +788,134 @@ class ModuleDecoder : public Decoder {
}
uint32_t consume_func_index(WasmModule* module, WasmFunction** func) {
+ return consume_index("function index", module->functions, func);
+ }
+
+ // Reads a global index and looks it up in {module->globals} by forwarding
+ // to consume_index with the name "global index"; {global} is the out
+ // parameter handed to consume_index and the return value is whatever
+ // consume_index returns.
+ uint32_t consume_global_index(WasmModule* module, WasmGlobal** global) {
+ return consume_index("global index", module->globals, global);
+ }
+
+ // Reads a table index and looks it up in {module->function_tables} by
+ // forwarding to consume_index with the name "table index"; {table} is the
+ // out parameter handed to consume_index and the return value is whatever
+ // consume_index returns.
+ uint32_t consume_table_index(WasmModule* module,
+ WasmIndirectFunctionTable** table) {
+ return consume_index("table index", module->function_tables, table);
+ }
+
+ template <typename T>
+ uint32_t consume_index(const char* name, std::vector<T>& vector, T** ptr) {
const byte* pos = pc_;
- uint32_t func_index = consume_u32v("function index");
- if (func_index >= module->functions.size()) {
- error(pos, pos, "function index %u out of bounds (%d functions)",
- func_index, static_cast<int>(module->functions.size()));
- *func = nullptr;
+ uint32_t index = consume_u32v(name);
+ if (index >= vector.size()) {
+ error(pos, pos, "%s %u out of bounds (%d entries)", name, index,
+ static_cast<int>(vector.size()));
+ *ptr = nullptr;
return 0;
}
- *func = &module->functions[func_index];
- return func_index;
+ *ptr = &vector[index];
+ return index;
+ }
+
+  // Reads a resizable-limits record: a LEB128 flags word, an initial size
+  // and, only when bit 0 of the flags is set, a maximum size. The values are
+  // stored through {initial} and {maximum}; {maximum} is set to 0 when no
+  // maximum is present. Errors are reported if either size exceeds
+  // {max_value} or if the maximum is smaller than the initial size. {name}
+  // and {units} are used only to build the error messages.
+  void consume_resizable_limits(const char* name, const char* units,
+                                uint32_t max_value, uint32_t* initial,
+                                uint32_t* maximum) {
+    const uint32_t flags = consume_u32v("resizable limits flags");
+    const bool has_maximum = (flags & 1) != 0;
+
+    const byte* initial_pos = pc();
+    *initial = consume_u32v("initial size");
+    if (*initial > max_value) {
+      error(initial_pos, initial_pos,
+            "initial %s size (%u %s) is larger than maximum allowable (%u)",
+            name, *initial, units, max_value);
+    }
+
+    if (!has_maximum) {
+      *maximum = 0;
+      return;
+    }
+
+    const byte* maximum_pos = pc();
+    *maximum = consume_u32v("maximum size");
+    if (*maximum > max_value) {
+      error(maximum_pos, maximum_pos,
+            "maximum %s size (%u %s) is larger than maximum allowable (%u)",
+            name, *maximum, units, max_value);
+    }
+    if (*maximum < *initial) {
+      error(maximum_pos, maximum_pos,
+            "maximum %s size (%u %s) is less than initial (%u %s)", name,
+            *maximum, units, *initial, units);
+    }
+  }
+
+  // Consumes one byte and checks that it equals {expected}. Returns true on
+  // a match; otherwise reports an error located at the byte that was read
+  // and returns false. {name} labels the byte in the error message.
+  bool expect_u8(const char* name, uint8_t expected) {
+    const byte* start = pc();
+    const uint8_t actual = consume_u8(name);
+    if (actual == expected) return true;
+    error(start, start, "expected %s 0x%02x, got 0x%02x", name, expected,
+          actual);
+    return false;
+  }
+
+  // Decodes an initialization expression starting at {pc_}: one opcode
+  // (get_global or an i32/i64/f32/f64 constant) with its immediate, followed
+  // by an end opcode.
+  //
+  // {module} is used to resolve the type of a referenced global.
+  // {expected} is the required result type; pass kAstStmt to skip the type
+  // check (the caller is then responsible for validating the type).
+  //
+  // Returns the decoded expression. Its kind is WasmInitExpr::kNone if the
+  // opcode is not allowed in an initializer or the end opcode is missing; in
+  // both cases an error has been reported. A type mismatch against
+  // {expected} also reports an error but leaves the decoded expression as is.
+  WasmInitExpr consume_init_expr(WasmModule* module, LocalType expected) {
+    const byte* pos = pc();
+    uint8_t opcode = consume_u8("opcode");
+    WasmInitExpr expr;
+    // Number of immediate bytes following the opcode, as reported by the
+    // operand helper; consumed after the switch.
+    unsigned len = 0;
+    // The opcode byte has already been consumed, so the operand helpers are
+    // handed {pc() - 1}, i.e. the position of the opcode itself.
+    switch (opcode) {
+      case kExprGetGlobal: {
+        GlobalIndexOperand operand(this, pc() - 1);
+        expr.kind = WasmInitExpr::kGlobalIndex;
+        expr.val.global_index = operand.index;
+        len = operand.length;
+        break;
+      }
+      case kExprI32Const: {
+        ImmI32Operand operand(this, pc() - 1);
+        expr.kind = WasmInitExpr::kI32Const;
+        expr.val.i32_const = operand.value;
+        len = operand.length;
+        break;
+      }
+      case kExprF32Const: {
+        ImmF32Operand operand(this, pc() - 1);
+        expr.kind = WasmInitExpr::kF32Const;
+        expr.val.f32_const = operand.value;
+        len = operand.length;
+        break;
+      }
+      case kExprI64Const: {
+        ImmI64Operand operand(this, pc() - 1);
+        expr.kind = WasmInitExpr::kI64Const;
+        expr.val.i64_const = operand.value;
+        len = operand.length;
+        break;
+      }
+      case kExprF64Const: {
+        ImmF64Operand operand(this, pc() - 1);
+        expr.kind = WasmInitExpr::kF64Const;
+        expr.val.f64_const = operand.value;
+        len = operand.length;
+        break;
+      }
+      default: {
+        error("invalid opcode in initialization expression");
+        expr.kind = WasmInitExpr::kNone;
+        expr.val.i32_const = 0;
+      }
+    }
+    consume_bytes(len, "init code");
+    if (!expect_u8("end opcode", kExprEnd)) {
+      expr.kind = WasmInitExpr::kNone;
+    }
+    if (expected != kAstStmt) {
+      // Check against the caller's {expected} type. Comparing with a fixed
+      // kAstI32 here would wrongly reject valid non-i32 initializers and
+      // wrongly accept i32 initializers where another type is required.
+      const LocalType actual = TypeOf(module, expr);
+      if (actual != expected) {
+        error(pos, pos, "type error in init expression, expected %s, got %s",
+              WasmOpcodes::TypeName(expected), WasmOpcodes::TypeName(actual));
+      }
+    }
+    return expr;
+  }
// Reads a single 8-bit integer, interpreting it as a local type.
- LocalType consume_local_type() {
- byte val = consume_u8("local type");
+ LocalType consume_value_type() {
+ byte val = consume_u8("value type");
LocalTypeCode t = static_cast<LocalTypeCode>(val);
switch (t) {
- case kLocalVoid:
- return kAstStmt;
case kLocalI32:
return kAstI32;
case kLocalI64:
@@ -634,6 +924,8 @@ class ModuleDecoder : public Decoder {
return kAstF32;
case kLocalF64:
return kAstF64;
+ case kLocalS128:
+ return kAstS128;
default:
error(pc_ - 1, "invalid local type");
return kAstStmt;
@@ -642,19 +934,12 @@ class ModuleDecoder : public Decoder {
// Parses a type entry, which is currently limited to functions only.
FunctionSig* consume_sig() {
- const byte* pos = pc_;
- byte form = consume_u8("type form");
- if (form != kWasmFunctionTypeForm) {
- error(pos, pos, "expected function type form (0x%02x), got: 0x%02x",
- kWasmFunctionTypeForm, form);
- return nullptr;
- }
+ if (!expect_u8("type form", kWasmFunctionTypeForm)) return nullptr;
// parse parameter types
uint32_t param_count = consume_u32v("param count");
std::vector<LocalType> params;
- for (uint32_t i = 0; i < param_count; ++i) {
- LocalType param = consume_local_type();
- if (param == kAstStmt) error(pc_ - 1, "invalid void parameter type");
+ for (uint32_t i = 0; ok() && i < param_count; ++i) {
+ LocalType param = consume_value_type();
params.push_back(param);
}
@@ -667,12 +952,16 @@ class ModuleDecoder : public Decoder {
return nullptr;
}
std::vector<LocalType> returns;
- for (uint32_t i = 0; i < return_count; ++i) {
- LocalType ret = consume_local_type();
- if (ret == kAstStmt) error(pc_ - 1, "invalid void return type");
+ for (uint32_t i = 0; ok() && i < return_count; ++i) {
+ LocalType ret = consume_value_type();
returns.push_back(ret);
}
+ if (failed()) {
+ // Decoding failed, return void -> void
+ return new (module_zone) FunctionSig(0, 0, nullptr);
+ }
+
// FunctionSig stores the return types first.
LocalType* buffer =
module_zone->NewArray<LocalType>(param_count + return_count);
@@ -711,7 +1000,7 @@ class FunctionError : public FunctionResult {
};
Vector<const byte> FindSection(const byte* module_start, const byte* module_end,
- WasmSection::Code code) {
+ WasmSectionCode code) {
Decoder decoder(module_start, module_end);
uint32_t magic_word = decoder.consume_u32("wasm magic");
@@ -720,24 +1009,14 @@ Vector<const byte> FindSection(const byte* module_start, const byte* module_end,
uint32_t magic_version = decoder.consume_u32("wasm version");
if (magic_version != kWasmVersion) decoder.error("wrong wasm version");
- while (decoder.more() && decoder.ok()) {
- // Read the section name.
- uint32_t string_length = decoder.consume_u32v("section name length");
- const byte* section_name_start = decoder.pc();
- decoder.consume_bytes(string_length);
- if (decoder.failed()) break;
-
- WasmSection::Code section =
- WasmSection::lookup(section_name_start, string_length);
-
- // Read and check the section size.
- uint32_t section_length = decoder.consume_u32v("section length");
-
- const byte* section_start = decoder.pc();
- decoder.consume_bytes(section_length);
- if (section == code && decoder.ok()) {
- return Vector<const uint8_t>(section_start, section_length);
+ WasmSectionIterator section_iter(decoder);
+ while (section_iter.more()) {
+ if (section_iter.section_code() == code) {
+ return Vector<const uint8_t>(section_iter.section_start(),
+ section_iter.section_length());
}
+ decoder.consume_bytes(section_iter.section_length(), "section payload");
+ section_iter.advance();
}
return Vector<const uint8_t>();
@@ -772,6 +1051,13 @@ FunctionSig* DecodeWasmSignatureForTesting(Zone* zone, const byte* start,
return decoder.DecodeFunctionSignature(start);
}
+// Testing entry point: decodes a single initialization expression from the
+// bytes between {start} and {end}. A ModuleDecoder with origin kWasmOrigin is
+// built on a function-local Zone, and the result of its DecodeInitExpr call
+// is returned by value.
+WasmInitExpr DecodeWasmInitExprForTesting(const byte* start, const byte* end) {
+ AccountingAllocator allocator;
+ Zone zone(&allocator);
+ ModuleDecoder decoder(&zone, start, end, kWasmOrigin);
+ return decoder.DecodeInitExpr(start);
+}
+
FunctionResult DecodeWasmFunction(Isolate* isolate, Zone* zone,
ModuleEnv* module_env,
const byte* function_start,
@@ -789,15 +1075,26 @@ FunctionResult DecodeWasmFunction(Isolate* isolate, Zone* zone,
return decoder.DecodeSingleFunction(module_env, function);
}
-FunctionOffsetsResult DecodeWasmFunctionOffsets(const byte* module_start,
- const byte* module_end) {
+FunctionOffsetsResult DecodeWasmFunctionOffsets(
+ const byte* module_start, const byte* module_end,
+ uint32_t num_imported_functions) {
+ // Find and decode the code section.
Vector<const byte> code_section =
- FindSection(module_start, module_end, WasmSection::Code::FunctionBodies);
+ FindSection(module_start, module_end, kCodeSectionCode);
Decoder decoder(code_section.start(), code_section.end());
- if (!code_section.start()) decoder.error("no code section");
+ FunctionOffsets table;
+ if (!code_section.start()) {
+ decoder.error("no code section");
+ return decoder.toResult(std::move(table));
+ }
+
+ // Reserve entries for the imported functions.
+ table.reserve(num_imported_functions);
+ for (uint32_t i = 0; i < num_imported_functions; i++) {
+ table.push_back(std::make_pair(0, 0));
+ }
uint32_t functions_count = decoder.consume_u32v("functions count");
- FunctionOffsets table;
// Take care of invalid input here.
if (functions_count < static_cast<unsigned>(code_section.length()) / 2)
table.reserve(functions_count);