// Copyright 2006-2008 the V8 project authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // This file contains support for URI manipulations written in // JavaScript. (function(global, utils) { "use strict"; %CheckIsBootstrapping(); //- ------------------------------------------------------------------ // Imports var GlobalObject = global.Object; var InternalArray = utils.InternalArray; var MakeURIError; utils.Import(function(from) { MakeURIError = from.MakeURIError; }); // ------------------------------------------------------------------- // Define internal helper functions. function HexValueOf(code) { // 0-9 if (code >= 48 && code <= 57) return code - 48; // A-F if (code >= 65 && code <= 70) return code - 55; // a-f if (code >= 97 && code <= 102) return code - 87; return -1; } function URIHexCharsToCharCode(highChar, lowChar) { var highCode = HexValueOf(highChar); var lowCode = HexValueOf(lowChar); if (highCode == -1 || lowCode == -1) throw MakeURIError(); return (highCode << 4) | lowCode; } // Callers must ensure that |result| is a sufficiently long sequential // two-byte string! function URIDecodeOctets(octets, result, index) { var value; var o0 = octets[0]; if (o0 < 0x80) { value = o0; } else if (o0 < 0xc2) { throw MakeURIError(); } else { var o1 = octets[1]; if (o0 < 0xe0) { var a = o0 & 0x1f; if ((o1 < 0x80) || (o1 > 0xbf)) throw MakeURIError(); var b = o1 & 0x3f; value = (a << 6) + b; if (value < 0x80 || value > 0x7ff) throw MakeURIError(); } else { var o2 = octets[2]; if (o0 < 0xf0) { var a = o0 & 0x0f; if ((o1 < 0x80) || (o1 > 0xbf)) throw MakeURIError(); var b = o1 & 0x3f; if ((o2 < 0x80) || (o2 > 0xbf)) throw MakeURIError(); var c = o2 & 0x3f; value = (a << 12) + (b << 6) + c; if ((value < 0x800) || (value > 0xffff)) throw MakeURIError(); } else { var o3 = octets[3]; if (o0 < 0xf8) { var a = (o0 & 0x07); if ((o1 < 0x80) || (o1 > 0xbf)) throw MakeURIError(); var b = (o1 & 0x3f); if ((o2 < 0x80) || (o2 > 0xbf)) { throw MakeURIError(); } var c = (o2 & 0x3f); if ((o3 < 0x80) || (o3 > 0xbf)) throw MakeURIError(); var d = (o3 & 0x3f); value = (a << 18) + (b << 12) + (c << 6) + d; if ((value < 0x10000) || (value > 0x10ffff)) throw MakeURIError(); } else { throw MakeURIError(); } } } } if (0xD800 <= value && value <= 0xDFFF) throw MakeURIError(); if (value < 0x10000) { %_TwoByteSeqStringSetChar(index++, value, result); } else { %_TwoByteSeqStringSetChar(index++, (value >> 10) + 0xd7c0, result); %_TwoByteSeqStringSetChar(index++, (value & 0x3ff) + 0xdc00, result); } return index; } // ECMA-262, section 15.1.3 function Decode(uri, reserved) { uri = TO_STRING(uri); var uriLength = uri.length; var one_byte = %NewString(uriLength, NEW_ONE_BYTE_STRING); var index = 0; var k = 0; // Optimistically assume one-byte string. for ( ; k < uriLength; k++) { var code = %_StringCharCodeAt(uri, k); if (code == 37) { // '%' if (k + 2 >= uriLength) throw MakeURIError(); var cc = URIHexCharsToCharCode(%_StringCharCodeAt(uri, k+1), %_StringCharCodeAt(uri, k+2)); if (cc >> 7) break; // Assumption wrong, two-byte string. if (reserved(cc)) { %_OneByteSeqStringSetChar(index++, 37, one_byte); // '%'. %_OneByteSeqStringSetChar(index++, %_StringCharCodeAt(uri, k+1), one_byte); %_OneByteSeqStringSetChar(index++, %_StringCharCodeAt(uri, k+2), one_byte); } else { %_OneByteSeqStringSetChar(index++, cc, one_byte); } k += 2; } else { if (code > 0x7f) break; // Assumption wrong, two-byte string. %_OneByteSeqStringSetChar(index++, code, one_byte); } } one_byte = %TruncateString(one_byte, index); if (k == uriLength) return one_byte; // Write into two byte string. var two_byte = %NewString(uriLength - k, NEW_TWO_BYTE_STRING); index = 0; for ( ; k < uriLength; k++) { var code = %_StringCharCodeAt(uri, k); if (code == 37) { // '%' if (k + 2 >= uriLength) throw MakeURIError(); var cc = URIHexCharsToCharCode(%_StringCharCodeAt(uri, ++k), %_StringCharCodeAt(uri, ++k)); if (cc >> 7) { var n = 0; while (((cc << ++n) & 0x80) != 0) { } if (n == 1 || n > 4) throw MakeURIError(); var octets = new InternalArray(n); octets[0] = cc; if (k + 3 * (n - 1) >= uriLength) throw MakeURIError(); for (var i = 1; i < n; i++) { if (uri[++k] != '%') throw MakeURIError(); octets[i] = URIHexCharsToCharCode(%_StringCharCodeAt(uri, ++k), %_StringCharCodeAt(uri, ++k)); } index = URIDecodeOctets(octets, two_byte, index); } else if (reserved(cc)) { %_TwoByteSeqStringSetChar(index++, 37, two_byte); // '%'. %_TwoByteSeqStringSetChar(index++, %_StringCharCodeAt(uri, k - 1), two_byte); %_TwoByteSeqStringSetChar(index++, %_StringCharCodeAt(uri, k), two_byte); } else { %_TwoByteSeqStringSetChar(index++, cc, two_byte); } } else { %_TwoByteSeqStringSetChar(index++, code, two_byte); } } two_byte = %TruncateString(two_byte, index); return one_byte + two_byte; } // ------------------------------------------------------------------- // Define exported functions. // ECMA-262 - B.2.1. function URIEscapeJS(s) { return %URIEscape(s); } // ECMA-262 - B.2.2. function URIUnescapeJS(s) { return %URIUnescape(s); } // ECMA-262 - 15.1.3.1. function URIDecode(uri) { var reservedPredicate = function(cc) { // #$ if (35 <= cc && cc <= 36) return true; // & if (cc == 38) return true; // +, if (43 <= cc && cc <= 44) return true; // / if (cc == 47) return true; // :; if (58 <= cc && cc <= 59) return true; // = if (cc == 61) return true; // ?@ if (63 <= cc && cc <= 64) return true; return false; }; return Decode(uri, reservedPredicate); } // ECMA-262 - 15.1.3.2. function URIDecodeComponent(component) { var reservedPredicate = function(cc) { return false; }; return Decode(component, reservedPredicate); } // ------------------------------------------------------------------- // Install exported functions. // Set up non-enumerable URI functions on the global object and set // their names. utils.InstallFunctions(global, DONT_ENUM, [ "escape", URIEscapeJS, "unescape", URIUnescapeJS, "decodeURI", URIDecode, "decodeURIComponent", URIDecodeComponent ]); })