char-predicates.h 2.67 KB
Newer Older
1
// Copyright 2011 the V8 project authors. All rights reserved.
2 3
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4 5 6 7

#ifndef V8_CHAR_PREDICATES_H_
#define V8_CHAR_PREDICATES_H_

8
#include "src/globals.h"
9
#include "src/unicode.h"
10

11 12
namespace v8 {
namespace internal {
13 14 15 16

// Unicode character predicates as defined by ECMA-262, 3rd edition,
// used for lexical analysis.

17
// Forward declarations of the inline character predicates. Only the
// signatures appear in this header; the definitions are provided elsewhere
// (presumably in a companion -inl.h file -- TODO confirm).

// ASCII case folding.
inline int AsciiAlphaToLower(uc32 c);

// Single-character line-break tests.
inline bool IsCarriageReturn(uc32 c);
inline bool IsLineFeed(uc32 c);

// ASCII identifier / alphanumeric tests.
inline bool IsAsciiIdentifier(uc32 c);
inline bool IsAlphaNumeric(uc32 c);

// Digit classes for the supported numeric literal radixes.
inline bool IsDecimalDigit(uc32 c);
inline bool IsHexDigit(uc32 c);
inline bool IsOctalDigit(uc32 c);
inline bool IsBinaryDigit(uc32 c);

// Character classes used by the regular expression engine.
inline bool IsRegExpWord(uc32 c);
inline bool IsRegExpNewline(uc32 c);
28

29
// ES#sec-names-and-keywords
30 31 32 33
// This includes '_', '$' and '\', and ID_Start according to
// http://www.unicode.org/reports/tr31/, which consists of categories
// 'Lu', 'Ll', 'Lt', 'Lm', 'Lo', 'Nl', but excluding properties
// 'Pattern_Syntax' or 'Pattern_White_Space'.
34 35 36 37
#ifdef V8_INTL_SUPPORT
struct V8_EXPORT_PRIVATE IdentifierStart {
  static bool Is(uc32 c);
#else
38
struct IdentifierStart {
39
  // Non-BMP characters are not supported without I18N.
40
  static inline bool Is(uc32 c) {
41
    return (c <= 0xFFFF) ? unibrow::ID_Start::Is(c) : false;
42
  }
43
#endif
44 45
};

46
// ES#sec-names-and-keywords
47 48 49 50
// This includes \u200c and \u200d, and ID_Continue according to
// http://www.unicode.org/reports/tr31/, which consists of ID_Start,
// the categories 'Mn', 'Mc', 'Nd', 'Pc', but excluding properties
// 'Pattern_Syntax' or 'Pattern_White_Space'.
51 52 53 54
#ifdef V8_INTL_SUPPORT
struct V8_EXPORT_PRIVATE IdentifierPart {
  static bool Is(uc32 c);
#else
55 56
struct IdentifierPart {
  static inline bool Is(uc32 c) {
57 58 59 60 61
    // Non-BMP charaacters are not supported without I18N.
    if (c <= 0xFFFF) {
      return unibrow::ID_Start::Is(c) || unibrow::ID_Continue::Is(c);
    }
    return false;
62
  }
63
#endif
64 65
};

66 67
// ES6 draft section 11.2
// This includes all code points of Unicode category 'Zs'.
68 69 70 71 72
// Further included are \u0009, \u000b, \u000c, and \ufeff.
#ifdef V8_INTL_SUPPORT
struct V8_EXPORT_PRIVATE WhiteSpace {
  static bool Is(uc32 c);
#else
73
struct WhiteSpace {
74
  static inline bool Is(uc32 c) { return unibrow::WhiteSpace::Is(c); }
75
#endif
76 77
};

78
// WhiteSpace and LineTerminator according to ES6 draft section 11.2 and 11.3
79 80
// This includes all the characters with Unicode category 'Z' (= Zs+Zl+Zp)
// as well as \u0009 - \u000d and \ufeff.
81 82
struct WhiteSpaceOrLineTerminator {
  static inline bool Is(uc32 c) {
83
    return WhiteSpace::Is(c) || unibrow::IsLineTerminator(c);
84 85 86
  }
};

87 88
}  // namespace internal
}  // namespace v8
89 90

#endif  // V8_CHAR_PREDICATES_H_