Implemented detection of invalid UTF-8 in decodeURI. That is, detection
of invalid UTF-8, not invalid UTF-8 detection.


git-svn-id: http://v8.googlecode.com/svn/branches/bleeding_edge@1471 ce2b1a6d-e550-0410-aec6-3dcde31c8c00
parent 5718547a
...@@ -302,10 +302,6 @@ function SetupRegExp() { ...@@ -302,10 +302,6 @@ function SetupRegExp() {
"compile", CompileRegExp "compile", CompileRegExp
)); ));
// The spec says nothing about the length of exec and test, but
// SpiderMonkey and KJS have length equal to 0.
%FunctionSetLength($RegExp.prototype.exec, 0);
%FunctionSetLength($RegExp.prototype.test, 0);
// The length of compile is 1 in SpiderMonkey. // The length of compile is 1 in SpiderMonkey.
%FunctionSetLength($RegExp.prototype.compile, 1); %FunctionSetLength($RegExp.prototype.compile, 1);
......
...@@ -90,27 +90,65 @@ function URIHexCharsToCharCode(ch1, ch2) { ...@@ -90,27 +90,65 @@ function URIHexCharsToCharCode(ch1, ch2) {
function URIDecodeOctets(octets, result, index) { function URIDecodeOctets(octets, result, index) {
if (octets[3]) { var value;
var x = (octets[2] >> 4) & 3; var o0 = octets[0];
var y = octets[2] & 0xF; if (o0 < 0x80) {
var z = octets[3] & 63; value = o0;
var v = (((octets[0] & 7) << 2) | ((octets[1] >> 4) & 3)) - 1; } else if (o0 < 0xc2) {
var w = octets[1] & 0xF; throw new $URIError("URI malformed");
result[index++] = 55296 | (v << 6) | (w << 2) | x; } else {
result[index++] = 56320 | (y << 6) | z; var o1 = octets[1];
return index; if (o0 < 0xe0) {
var a = o0 & 0x1f;
if ((o1 < 0x80) || (o1 > 0xbf))
throw new $URIError("URI malformed");
var b = o1 & 0x3f;
value = (a << 6) + b;
if (value < 0x80 || value > 0x7ff)
throw new $URIError("URI malformed");
} else {
var o2 = octets[2];
if (o0 < 0xf0) {
var a = o0 & 0x0f;
if ((o1 < 0x80) || (o1 > 0xbf))
throw new $URIError("URI malformed");
var b = o1 & 0x3f;
if ((o2 < 0x80) || (o2 > 0xbf))
throw new $URIError("URI malformed");
var c = o2 & 0x3f;
value = (a << 12) + (b << 6) + c;
if ((value < 0x800) || (value > 0xffff))
throw new $URIError("URI malformed");
} else {
var o3 = octets[3];
if (o0 < 0xf8) {
var a = (o0 & 0x07);
if ((o1 < 0x80) || (o1 > 0xbf))
throw new $URIError("URI malformed");
var b = (o1 & 0x3f);
if ((o2 < 0x80) || (o2 > 0xbf))
throw new $URIError("URI malformed");
var c = (o2 & 0x3f);
if ((o3 < 0x80) || (o3 > 0xbf))
throw new $URIError("URI malformed");
var d = (o3 & 0x3f);
value = (a << 18) + (b << 12) + (c << 6) + d;
if ((value < 0x10000) || (value > 0x10ffff))
throw new $URIError("URI malformed");
} else {
throw new $URIError("URI malformed");
}
}
}
} }
if (octets[2]) { if (value < 0x10000) {
var x = octets[0] & 0xF; result[index++] = value;
var y = octets[1] & 63; return index;
var z = octets[2] & 63; } else {
result[index++] = (x << 12) | (y << 6) | z; result[index++] = (value >> 10) + 0xd7c0;
result[index++] = (value & 0x3ff) + 0xdc00;
return index; return index;
} }
var z = octets[1] & 63;
var y = octets[0] & 31;
result[index++] = (y << 6) | z;
return index;
} }
......
// Copyright 2009 the V8 project authors. All rights reserved.
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following
// disclaimer in the documentation and/or other materials provided
// with the distribution.
// * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived
// from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// Pairs of [character code, escaped form]. Each character code names a
// single UTF-16 code unit, and the string is the percent-escaped text that
// encodeURI is expected to produce for it (and decodeURI to accept).
var kLegalPairs = [
  // Escaped as a single octet.
  [0x00, '%00'], [0x01, '%01'], [0x7f, '%7F'],

  // Escaped as two octets.
  [0x80, '%C2%80'], [0x81, '%C2%81'], [0x7ff, '%DF%BF'],

  // Escaped as three octets.
  [0x800, '%E0%A0%80'], [0x801, '%E0%A0%81'],
  [0xd7ff, '%ED%9F%BF'], [0xffff, '%EF%BF%BF']
];
// Escaped strings that decodeURI is expected to reject; run() checks that
// each one makes decodeURI throw a URIError.
var kIllegalEncoded = [
  '%80', '%BF', '%80%BF', '%80%BF%80', '%C0%22', '%DF',
  '%EF%BF', '%F7BFBF', '%FE', '%FF', '%FE%FE%FF%FF',
  '%C0%AF', '%E0%9F%BF', '%F0%8F%BF%BF', '%C0%80',
  '%E0%80%80',
  // '%F7BFBF' above has no '%' in front of its last two hex pairs, so only
  // its first octet is actually escaped. The fully escaped spelling of the
  // same three octets is listed as well so that both forms are exercised.
  '%F7%BF%BF'
];
/**
 * Runs the URI encoding checks.
 *
 * For every [charCode, encoded] entry of kLegalPairs, checks that decodeURI
 * turns the escaped string into the one-character string for charCode and
 * that encodeURI turns that character back into the escaped string.
 *
 * For every entry of kIllegalEncoded, checks that decodeURI throws and that
 * the thrown value is a URIError. If decodeURI returns normally, the entry
 * is reported through fail().
 */
function run() {
  for (var i = 0; i < kLegalPairs.length; i++) {
    var decoded = String.fromCharCode(kLegalPairs[i][0]);
    var encoded = kLegalPairs[i][1];
    assertEquals(decodeURI(encoded), decoded);
    assertEquals(encodeURI(decoded), encoded);
  }
  for (var i = 0; i < kIllegalEncoded.length; i++) {
    var value = kIllegalEncoded[i];
    var threw = false;
    try {
      decodeURI(value);
    } catch (e) {
      threw = true;
      assertInstanceof(e, URIError);
    }
    // Report a missing exception outside the try block, so that anything
    // fail() throws is not intercepted by the catch handler above and
    // misreported as a wrong exception type.
    if (!threw) {
      fail(value);
    }
  }
}
// Execute the checks when this file is loaded.
run();
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment