Index: test/mjsunit/wasm/unicode-validation.js |
diff --git a/test/mjsunit/wasm/unicode-validation.js b/test/mjsunit/wasm/unicode-validation.js |
new file mode 100644 |
index 0000000000000000000000000000000000000000..b2e46030877ccd1223de013cafe83d73a1d7babb |
--- /dev/null |
+++ b/test/mjsunit/wasm/unicode-validation.js |
@@ -0,0 +1,121 @@ |
+// Copyright 2016 the V8 project authors. All rights reserved. |
+// Use of this source code is governed by a BSD-style license that can be |
+// found in the LICENSE file. |
+ |
+// Flags: --expose-wasm |
+ |
+load("test/mjsunit/wasm/wasm-constants.js"); |
+load("test/mjsunit/wasm/wasm-module-builder.js"); |
+ |
+function toByteArray(s) { |
+ var arr = []; |
+ for (var i = 0; i < s.length; ++i) { |
+ arr.push(s.charCodeAt(i) & 0xff); |
+ } |
+ return arr; |
+} |
+ |
+function toString(arr) { |
+ if (typeof arr === "string") return arr; |
+ var s = ""; |
+ for (var b of arr) s += String.fromCharCode(b); |
+ return s; |
+} |
+ |
+function toUTF8(arr) { |
+ if (typeof arr === "string" || arr === undefined) return arr; |
+ return decodeURIComponent(escape(toString(arr))); |
+} |
+ |
+function isValidUtf8(arr) { |
+ if (typeof arr === "string" || arr === undefined) return true; |
+ try { |
+ var s = toUTF8(arr); |
+ for (var i = 0; i < s.length; ++i) |
+ if ((s.charCodeAt(i) & 0xfffe) == 0xfffe) |
+ return false; |
+ return true; |
+ } catch (e) { |
+ if (e instanceof URIError) return false; |
+ throw e; |
+ } |
+} |
+ |
+function checkImportsAndExports(imported_module_name, imported_function_name, |
+ internal_function_name, exported_function_name, shouldThrow) { |
+ var builder = new WasmModuleBuilder(); |
+ |
+ builder.addImportWithModule(imported_module_name, imported_function_name, |
+ kSig_v_v); |
+ |
+ builder.addFunction(internal_function_name, kSig_v_v) |
+ .addBody([kExprCallImport, kArity0, 0]) |
+ .exportAs(exported_function_name); |
+ |
+ // sanity check: does javascript agree with out shouldThrow annotation? |
+ assertEquals(shouldThrow, |
+ !isValidUtf8(imported_module_name) || |
+ !isValidUtf8(imported_function_name) || |
+ !isValidUtf8(exported_function_name), |
+ "JavaScript does not agree with our shouldThrow expectation"); |
+ |
+ if (!shouldThrow) { |
+ imported_module_name = toUTF8(imported_module_name); |
+ imported_function_name = toUTF8(imported_function_name); |
+ } |
+ |
+ var ffi = new Object(); |
+ if (imported_function_name === undefined) { |
+ ffi[imported_module_name] = function() { }; |
+ } else { |
+ ffi[imported_module_name] = new Object(); |
+ ffi[imported_module_name][imported_function_name] = function() { }; |
+ } |
+ |
+ var hasThrown = true; |
+ try { |
+ builder.instantiate(ffi); |
+ hasThrown = false; |
+ } catch (err) { |
+ if (!shouldThrow) print(err); |
+ assertTrue(shouldThrow, "Should not throw error on valid names"); |
+ assertContains("UTF-8", err.toString()); |
+ } |
+ assertEquals(shouldThrow, hasThrown, |
+ "Should throw validation error on invalid names"); |
+} |
+ |
+function checkImportedModuleName(name, shouldThrow) { |
+ checkImportsAndExports(name, "imp", "func", undefined, shouldThrow); |
+} |
+ |
+function checkImportedFunctionName(name, shouldThrow) { |
+ checkImportsAndExports("module", name, "func", "func", shouldThrow); |
+} |
+ |
+function checkExportedFunctionName(name, shouldThrow) { |
+ checkImportsAndExports("module", "func", "func", name, shouldThrow); |
+} |
+ |
+function checkInternalFunctionName(name) { |
+ checkImportsAndExports("module", "func", name, "func", false); |
+} |
+ |
+function checkAll(name, shouldThrow) { |
+ checkImportedModuleName(name, shouldThrow); |
+ checkImportedFunctionName(name, shouldThrow); |
+ checkExportedFunctionName(name, shouldThrow); |
+ checkInternalFunctionName(name); |
+} |
+ |
+checkAll("ascii", false); |
+checkAll("some math: (½)² = ¼", false); |
+checkAll("中国历史系列条目\n北", false); |
+checkAll(toByteArray("\xef\xb7\x8f"), false); |
+checkAll(toByteArray("a\xc2\x81\xe1\x80\xbf\xf1\x80\xa0\xbf"), false); |
+checkAll(toByteArray("\xff"), true); |
+checkAll(toByteArray("\xed\xa0\x8f"), true); // surrogate code points |
+checkAll(toByteArray("\xe0\x82\x80"), true); // overlong sequence |
+checkAll(toByteArray("\xf4\x90\x80\x80"), true); // beyond limit: U+110000 |
+checkAll(toByteArray("\xef\xbf\xbe"), true); // non-character; U+FFFE |
+checkAll(toByteArray("with\x00null"), false); |