#include "builtin/String.h"
#include "mozilla/ArrayUtils.h"
#include "mozilla/Attributes.h"
#include "mozilla/CheckedInt.h"
#include "mozilla/FloatingPoint.h"
#include "mozilla/PodOperations.h"
#include "mozilla/Range.h"
#include "mozilla/TypeTraits.h"
#include "mozilla/Unused.h"
#include <ctype.h>
#include <limits>
#include <string.h>
#include "jsapi.h"
#include "jsnum.h"
#include "jstypes.h"
#include "jsutil.h"
#include "builtin/Array.h"
#include "builtin/Boolean.h"
#include "builtin/intl/CommonFunctions.h"
#include "builtin/intl/ICUStubs.h"
#include "builtin/RegExp.h"
#include "jit/InlinableNatives.h"
#include "js/Conversions.h"
#if !EXPOSE_INTL_API
# include "js/LocaleSensitive.h"
#endif
#include "js/PropertySpec.h"
#include "js/StableStringChars.h"
#include "js/UniquePtr.h"
#if ENABLE_INTL_API
# include "unicode/uchar.h"
# include "unicode/unorm2.h"
#endif
#include "util/StringBuffer.h"
#include "util/Unicode.h"
#include "vm/BytecodeUtil.h"
#include "vm/GlobalObject.h"
#include "vm/Interpreter.h"
#include "vm/JSAtom.h"
#include "vm/JSContext.h"
#include "vm/JSObject.h"
#include "vm/Opcodes.h"
#include "vm/Printer.h"
#include "vm/RegExpObject.h"
#include "vm/RegExpStatics.h"
#include "vm/SelfHosting.h"
#include "vm/InlineCharBuffer-inl.h"
#include "vm/Interpreter-inl.h"
#include "vm/StringObject-inl.h"
#include "vm/StringType-inl.h"
#include "vm/TypeInference-inl.h"
using namespace js;
using JS::Symbol;
using JS::SymbolCode;
using mozilla::CheckedInt;
using mozilla::IsNaN;
using mozilla::IsSame;
using mozilla::PodCopy;
using mozilla::RangedPtr;
using JS::AutoCheckCannotGC;
using JS::AutoStableStringChars;
static JSLinearString* ArgToLinearString(JSContext* cx, const CallArgs& args,
unsigned argno) {
if (argno >= args.length()) {
return cx->names().undefined;
}
JSString* str = ToString<CanGC>(cx, args[argno]);
if (!str) {
return nullptr;
}
return str->ensureLinear(cx);
}
static bool str_decodeURI(JSContext* cx, unsigned argc, Value* vp);
static bool str_decodeURI_Component(JSContext* cx, unsigned argc, Value* vp);
static bool str_encodeURI(JSContext* cx, unsigned argc, Value* vp);
static bool str_encodeURI_Component(JSContext* cx, unsigned argc, Value* vp);
template <typename CharT>
static bool Escape(JSContext* cx, const CharT* chars, uint32_t length,
InlineCharBuffer<Latin1Char>& newChars,
uint32_t* newLengthOut) {
static const uint8_t shouldPassThrough[128] = {
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,0,0,1,1,0,1,1,1,
1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,
1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,0,0,0,0,1,
0,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,
1,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,
};
uint32_t newLength = length;
for (size_t i = 0; i < length; i++) {
char16_t ch = chars[i];
if (ch < 128 && shouldPassThrough[ch]) {
continue;
}
static_assert(JSString::MAX_LENGTH < UINT32_MAX - 5,
"Adding 5 to valid string length should not overflow");
MOZ_ASSERT(newLength <= JSString::MAX_LENGTH);
newLength += (ch < 256) ? 2 : 5;
if (MOZ_UNLIKELY(newLength > JSString::MAX_LENGTH)) {
ReportAllocationOverflow(cx);
return false;
}
}
if (newLength == length) {
*newLengthOut = newLength;
return true;
}
if (!newChars.maybeAlloc(cx, newLength)) {
return false;
}
static const char digits[] = "0123456789ABCDEF";
Latin1Char* rawNewChars = newChars.get();
size_t i, ni;
for (i = 0, ni = 0; i < length; i++) {
char16_t ch = chars[i];
if (ch < 128 && shouldPassThrough[ch]) {
rawNewChars[ni++] = ch;
} else if (ch < 256) {
rawNewChars[ni++] = '%';
rawNewChars[ni++] = digits[ch >> 4];
rawNewChars[ni++] = digits[ch & 0xF];
} else {
rawNewChars[ni++] = '%';
rawNewChars[ni++] = 'u';
rawNewChars[ni++] = digits[ch >> 12];
rawNewChars[ni++] = digits[(ch & 0xF00) >> 8];
rawNewChars[ni++] = digits[(ch & 0xF0) >> 4];
rawNewChars[ni++] = digits[ch & 0xF];
}
}
MOZ_ASSERT(ni == newLength);
*newLengthOut = newLength;
return true;
}
static bool str_escape(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
InlineCharBuffer<Latin1Char> newChars;
uint32_t newLength = 0; if (str->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
if (!Escape(cx, str->latin1Chars(nogc), str->length(), newChars,
&newLength)) {
return false;
}
} else {
AutoCheckCannotGC nogc;
if (!Escape(cx, str->twoByteChars(nogc), str->length(), newChars,
&newLength)) {
return false;
}
}
if (newLength == str->length()) {
args.rval().setString(str);
return true;
}
JSString* res = newChars.toString(cx, newLength);
if (!res) {
return false;
}
args.rval().setString(res);
return true;
}
template <typename CharT>
static inline bool Unhex4(const RangedPtr<const CharT> chars,
char16_t* result) {
char16_t a = chars[0], b = chars[1], c = chars[2], d = chars[3];
if (!(JS7_ISHEX(a) && JS7_ISHEX(b) && JS7_ISHEX(c) && JS7_ISHEX(d))) {
return false;
}
*result =
(((((JS7_UNHEX(a) << 4) + JS7_UNHEX(b)) << 4) + JS7_UNHEX(c)) << 4) +
JS7_UNHEX(d);
return true;
}
template <typename CharT>
static inline bool Unhex2(const RangedPtr<const CharT> chars,
char16_t* result) {
char16_t a = chars[0], b = chars[1];
if (!(JS7_ISHEX(a) && JS7_ISHEX(b))) {
return false;
}
*result = (JS7_UNHEX(a) << 4) + JS7_UNHEX(b);
return true;
}
template <typename CharT>
static bool Unescape(StringBuffer& sb,
const mozilla::Range<const CharT> chars) {
uint32_t length = chars.length();
bool building = false;
#define ENSURE_BUILDING \
do { \
if (!building) { \
building = true; \
if (!sb.reserve(length)) return false; \
sb.infallibleAppend(chars.begin().get(), k); \
} \
} while (false);
uint32_t k = 0;
while (k < length) {
char16_t c = chars[k];
if (c == '%') {
static_assert(JSString::MAX_LENGTH < UINT32_MAX - 6,
"String length is not near UINT32_MAX");
if (k + 6 <= length && chars[k + 1] == 'u') {
if (Unhex4(chars.begin() + k + 2, &c)) {
ENSURE_BUILDING
k += 5;
}
} else if (k + 3 <= length) {
if (Unhex2(chars.begin() + k + 1, &c)) {
ENSURE_BUILDING
k += 2;
}
}
}
if (building && !sb.append(c)) {
return false;
}
k += 1;
}
return true;
#undef ENSURE_BUILDING
}
static bool str_unescape(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
StringBuffer sb(cx);
if (str->hasTwoByteChars() && !sb.ensureTwoByteChars()) {
return false;
}
if (str->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
if (!Unescape(sb, str->latin1Range(nogc))) {
return false;
}
} else {
AutoCheckCannotGC nogc;
if (!Unescape(sb, str->twoByteRange(nogc))) {
return false;
}
}
JSLinearString* result;
if (!sb.empty()) {
result = sb.finishString();
if (!result) {
return false;
}
} else {
result = str;
}
args.rval().setString(result);
return true;
}
static bool str_uneval(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
JSString* str = ValueToSource(cx, args.get(0));
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
static const JSFunctionSpec string_functions[] = {
JS_FN(js_escape_str, str_escape, 1, JSPROP_RESOLVING),
JS_FN(js_unescape_str, str_unescape, 1, JSPROP_RESOLVING),
JS_FN(js_uneval_str, str_uneval, 1, JSPROP_RESOLVING),
JS_FN(js_decodeURI_str, str_decodeURI, 1, JSPROP_RESOLVING),
JS_FN(js_encodeURI_str, str_encodeURI, 1, JSPROP_RESOLVING),
JS_FN(js_decodeURIComponent_str, str_decodeURI_Component, 1,
JSPROP_RESOLVING),
JS_FN(js_encodeURIComponent_str, str_encodeURI_Component, 1,
JSPROP_RESOLVING),
JS_FS_END};
static const unsigned STRING_ELEMENT_ATTRS =
JSPROP_ENUMERATE | JSPROP_READONLY | JSPROP_PERMANENT;
static bool str_enumerate(JSContext* cx, HandleObject obj) {
RootedString str(cx, obj->as<StringObject>().unbox());
js::StaticStrings& staticStrings = cx->staticStrings();
RootedValue value(cx);
for (size_t i = 0, length = str->length(); i < length; i++) {
JSString* str1 = staticStrings.getUnitStringForElement(cx, str, i);
if (!str1) {
return false;
}
value.setString(str1);
if (!DefineDataElement(cx, obj, i, value,
STRING_ELEMENT_ATTRS | JSPROP_RESOLVING)) {
return false;
}
}
return true;
}
static bool str_mayResolve(const JSAtomState&, jsid id, JSObject*) {
return JSID_IS_INT(id);
}
static bool str_resolve(JSContext* cx, HandleObject obj, HandleId id,
bool* resolvedp) {
if (!JSID_IS_INT(id)) {
return true;
}
RootedString str(cx, obj->as<StringObject>().unbox());
int32_t slot = JSID_TO_INT(id);
if ((size_t)slot < str->length()) {
JSString* str1 =
cx->staticStrings().getUnitStringForElement(cx, str, size_t(slot));
if (!str1) {
return false;
}
RootedValue value(cx, StringValue(str1));
if (!DefineDataElement(cx, obj, uint32_t(slot), value,
STRING_ELEMENT_ATTRS | JSPROP_RESOLVING)) {
return false;
}
*resolvedp = true;
}
return true;
}
static const ClassOps StringObjectClassOps = {
nullptr,
nullptr,
str_enumerate, nullptr,
str_resolve, str_mayResolve};
const Class StringObject::class_ = {
js_String_str,
JSCLASS_HAS_RESERVED_SLOTS(StringObject::RESERVED_SLOTS) |
JSCLASS_HAS_CACHED_PROTO(JSProto_String),
&StringObjectClassOps};
static MOZ_ALWAYS_INLINE JSString* ToStringForStringFunction(
JSContext* cx, HandleValue thisv) {
if (!CheckRecursionLimit(cx)) {
return nullptr;
}
if (thisv.isString()) {
return thisv.toString();
}
if (thisv.isObject()) {
RootedObject obj(cx, &thisv.toObject());
if (obj->is<StringObject>()) {
StringObject* nobj = &obj->as<StringObject>();
if (HasNoToPrimitiveMethodPure(nobj, cx) &&
HasNativeMethodPure(nobj, cx->names().toString, str_toString, cx)) {
return nobj->unbox();
}
}
} else if (thisv.isNullOrUndefined()) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_CANT_CONVERT_TO,
thisv.isNull() ? "null" : "undefined", "object");
return nullptr;
}
return ToStringSlow<CanGC>(cx, thisv);
}
MOZ_ALWAYS_INLINE bool IsString(HandleValue v) {
return v.isString() || (v.isObject() && v.toObject().is<StringObject>());
}
MOZ_ALWAYS_INLINE bool str_toSource_impl(JSContext* cx, const CallArgs& args) {
MOZ_ASSERT(IsString(args.thisv()));
JSString* str = ToString<CanGC>(cx, args.thisv());
if (!str) {
return false;
}
UniqueChars quoted = QuoteString(cx, str, '"');
if (!quoted) {
return false;
}
StringBuffer sb(cx);
if (!sb.append("(new String(") ||
!sb.append(quoted.get(), strlen(quoted.get())) || !sb.append("))")) {
return false;
}
JSString* result = sb.finishString();
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
static bool str_toSource(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
return CallNonGenericMethod<IsString, str_toSource_impl>(cx, args);
}
MOZ_ALWAYS_INLINE bool str_toString_impl(JSContext* cx, const CallArgs& args) {
MOZ_ASSERT(IsString(args.thisv()));
args.rval().setString(
args.thisv().isString()
? args.thisv().toString()
: args.thisv().toObject().as<StringObject>().unbox());
return true;
}
bool js::str_toString(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
return CallNonGenericMethod<IsString, str_toString_impl>(cx, args);
}
JSString* js::SubstringKernel(JSContext* cx, HandleString str, int32_t beginInt,
int32_t lengthInt) {
MOZ_ASSERT(0 <= beginInt);
MOZ_ASSERT(0 <= lengthInt);
MOZ_ASSERT(uint32_t(beginInt) <= str->length());
MOZ_ASSERT(uint32_t(lengthInt) <= str->length() - beginInt);
uint32_t begin = beginInt;
uint32_t len = lengthInt;
if (str->isRope()) {
JSRope* rope = &str->asRope();
if (begin + len <= rope->leftChild()->length()) {
return NewDependentString(cx, rope->leftChild(), begin, len);
}
if (begin >= rope->leftChild()->length()) {
begin -= rope->leftChild()->length();
return NewDependentString(cx, rope->rightChild(), begin, len);
}
MOZ_ASSERT(begin < rope->leftChild()->length() &&
begin + len > rope->leftChild()->length());
size_t lhsLength = rope->leftChild()->length() - begin;
size_t rhsLength = begin + len - rope->leftChild()->length();
Rooted<JSRope*> ropeRoot(cx, rope);
RootedString lhs(
cx, NewDependentString(cx, ropeRoot->leftChild(), begin, lhsLength));
if (!lhs) {
return nullptr;
}
RootedString rhs(
cx, NewDependentString(cx, ropeRoot->rightChild(), 0, rhsLength));
if (!rhs) {
return nullptr;
}
return JSRope::new_<CanGC>(cx, lhs, rhs, len);
}
return NewDependentString(cx, str, begin, len);
}
static char16_t Final_Sigma(const char16_t* chars, size_t length,
size_t index) {
MOZ_ASSERT(index < length);
MOZ_ASSERT(chars[index] == unicode::GREEK_CAPITAL_LETTER_SIGMA);
MOZ_ASSERT(unicode::ToLowerCase(unicode::GREEK_CAPITAL_LETTER_SIGMA) ==
unicode::GREEK_SMALL_LETTER_SIGMA);
#if ENABLE_INTL_API
JS::AutoSuppressGCAnalysis nogc;
bool precededByCased = false;
for (size_t i = index; i > 0;) {
char16_t c = chars[--i];
uint32_t codePoint = c;
if (unicode::IsTrailSurrogate(c) && i > 0) {
char16_t lead = chars[i - 1];
if (unicode::IsLeadSurrogate(lead)) {
codePoint = unicode::UTF16Decode(lead, c);
i--;
}
}
if (u_hasBinaryProperty(codePoint, UCHAR_CASE_IGNORABLE)) {
continue;
}
precededByCased = u_hasBinaryProperty(codePoint, UCHAR_CASED);
break;
}
if (!precededByCased) {
return unicode::GREEK_SMALL_LETTER_SIGMA;
}
bool followedByCased = false;
for (size_t i = index + 1; i < length;) {
char16_t c = chars[i++];
uint32_t codePoint = c;
if (unicode::IsLeadSurrogate(c) && i < length) {
char16_t trail = chars[i];
if (unicode::IsTrailSurrogate(trail)) {
codePoint = unicode::UTF16Decode(c, trail);
i++;
}
}
if (u_hasBinaryProperty(codePoint, UCHAR_CASE_IGNORABLE)) {
continue;
}
followedByCased = u_hasBinaryProperty(codePoint, UCHAR_CASED);
break;
}
if (!followedByCased) {
return unicode::GREEK_SMALL_LETTER_FINAL_SIGMA;
}
#endif
return unicode::GREEK_SMALL_LETTER_SIGMA;
}
static Latin1Char Final_Sigma(const Latin1Char* chars, size_t length,
size_t index) {
MOZ_ASSERT_UNREACHABLE("U+03A3 is not a Latin-1 character");
return 0;
}
template <typename CharT>
static size_t ToLowerCaseImpl(CharT* destChars, const CharT* srcChars,
size_t startIndex, size_t srcLength,
size_t destLength) {
MOZ_ASSERT(startIndex < srcLength);
MOZ_ASSERT(srcLength <= destLength);
MOZ_ASSERT_IF((IsSame<CharT, Latin1Char>::value), srcLength == destLength);
size_t j = startIndex;
for (size_t i = startIndex; i < srcLength; i++) {
char16_t c = srcChars[i];
if (!IsSame<CharT, Latin1Char>::value) {
if (unicode::IsLeadSurrogate(c) && i + 1 < srcLength) {
char16_t trail = srcChars[i + 1];
if (unicode::IsTrailSurrogate(trail)) {
trail = unicode::ToLowerCaseNonBMPTrail(c, trail);
destChars[j++] = c;
destChars[j++] = trail;
i++;
continue;
}
}
if (c == unicode::LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE) {
if (srcLength == destLength) {
return i;
}
destChars[j++] = CharT('i');
destChars[j++] = CharT(unicode::COMBINING_DOT_ABOVE);
continue;
}
if (c == unicode::GREEK_CAPITAL_LETTER_SIGMA) {
destChars[j++] = Final_Sigma(srcChars, srcLength, i);
continue;
}
}
c = unicode::ToLowerCase(c);
MOZ_ASSERT_IF((IsSame<CharT, Latin1Char>::value),
c <= JSString::MAX_LATIN1_CHAR);
destChars[j++] = c;
}
MOZ_ASSERT(j == destLength);
return srcLength;
}
static size_t ToLowerCaseLength(const char16_t* chars, size_t startIndex,
size_t length) {
size_t lowerLength = length;
for (size_t i = startIndex; i < length; i++) {
char16_t c = chars[i];
if (c == unicode::LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE) {
lowerLength += 1;
}
}
return lowerLength;
}
static size_t ToLowerCaseLength(const Latin1Char* chars, size_t startIndex,
size_t length) {
MOZ_ASSERT_UNREACHABLE("never called for Latin-1 strings");
return 0;
}
template <typename CharT>
static JSString* ToLowerCase(JSContext* cx, JSLinearString* str) {
InlineCharBuffer<CharT> newChars;
const size_t length = str->length();
size_t resultLength;
{
AutoCheckCannotGC nogc;
const CharT* chars = str->chars<CharT>(nogc);
MOZ_ASSERT(unicode::ChangesWhenLowerCased(
unicode::LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE),
"U+0130 has a simple lower case mapping");
MOZ_ASSERT(
unicode::ChangesWhenLowerCased(unicode::GREEK_CAPITAL_LETTER_SIGMA),
"U+03A3 has a simple lower case mapping");
if (IsSame<CharT, Latin1Char>::value) {
if (length == 1) {
char16_t lower = unicode::ToLowerCase(chars[0]);
MOZ_ASSERT(lower <= JSString::MAX_LATIN1_CHAR);
MOZ_ASSERT(StaticStrings::hasUnit(lower));
return cx->staticStrings().getUnit(lower);
}
}
size_t i = 0;
for (; i < length; i++) {
CharT c = chars[i];
if (!IsSame<CharT, Latin1Char>::value) {
if (unicode::IsLeadSurrogate(c) && i + 1 < length) {
CharT trail = chars[i + 1];
if (unicode::IsTrailSurrogate(trail)) {
if (unicode::ChangesWhenLowerCasedNonBMP(c, trail)) {
break;
}
i++;
continue;
}
}
}
if (unicode::ChangesWhenLowerCased(c)) {
break;
}
}
if (i == length) {
return str;
}
resultLength = length;
if (!newChars.maybeAlloc(cx, resultLength)) {
return nullptr;
}
PodCopy(newChars.get(), chars, i);
size_t readChars =
ToLowerCaseImpl(newChars.get(), chars, i, length, resultLength);
if (readChars < length) {
MOZ_ASSERT((!IsSame<CharT, Latin1Char>::value),
"Latin-1 strings don't have special lower case mappings");
resultLength = ToLowerCaseLength(chars, readChars, length);
if (!newChars.maybeRealloc(cx, length, resultLength)) {
return nullptr;
}
MOZ_ALWAYS_TRUE(length == ToLowerCaseImpl(newChars.get(), chars,
readChars, length,
resultLength));
}
}
return newChars.toStringDontDeflate(cx, resultLength);
}
JSString* js::StringToLowerCase(JSContext* cx, HandleString string) {
JSLinearString* linear = string->ensureLinear(cx);
if (!linear) {
return nullptr;
}
if (linear->hasLatin1Chars()) {
return ToLowerCase<Latin1Char>(cx, linear);
}
return ToLowerCase<char16_t>(cx, linear);
}
bool js::str_toLowerCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
JSString* result = StringToLowerCase(cx, str);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
static const char* CaseMappingLocale(JSContext* cx, JSString* str) {
JSLinearString* locale = str->ensureLinear(cx);
if (!locale) {
return nullptr;
}
MOZ_ASSERT(locale->length() >= 2, "locale is a valid language tag");
static const char languagesWithSpecialCasing[][3] = {"lt", "tr", "az"};
if (locale->length() == 2 || locale->latin1OrTwoByteChar(2) == '-') {
for (const auto& language : languagesWithSpecialCasing) {
if (locale->latin1OrTwoByteChar(0) == language[0] &&
locale->latin1OrTwoByteChar(1) == language[1]) {
return language;
}
}
}
return ""; }
bool js::intl_toLocaleLowerCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
MOZ_ASSERT(args.length() == 2);
MOZ_ASSERT(args[0].isString());
MOZ_ASSERT(args[1].isString());
RootedString string(cx, args[0].toString());
const char* locale = CaseMappingLocale(cx, args[1].toString());
if (!locale) {
return false;
}
if (intl::StringsAreEqual(locale, "")) {
JSString* str = StringToLowerCase(cx, string);
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
AutoStableStringChars inputChars(cx);
if (!inputChars.initTwoByte(cx, string)) {
return false;
}
mozilla::Range<const char16_t> input = inputChars.twoByteRange();
static_assert(JSString::MAX_LENGTH <= INT32_MAX,
"String length must fit in int32_t for ICU");
static const size_t INLINE_CAPACITY = js::intl::INITIAL_CHAR_BUFFER_SIZE;
Vector<char16_t, INLINE_CAPACITY> chars(cx);
if (!chars.resize(Max(INLINE_CAPACITY, input.length()))) {
return false;
}
int32_t size = intl::CallICU(
cx,
[&input, locale](UChar* chars, int32_t size, UErrorCode* status) {
return u_strToLower(chars, size, input.begin().get(), input.length(),
locale, status);
},
chars);
if (size < 0) {
return false;
}
JSString* result = NewStringCopyN<CanGC>(cx, chars.begin(), size);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
#if EXPOSE_INTL_API
#else
bool js::str_toLocaleLowerCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
if (cx->runtime()->localeCallbacks &&
cx->runtime()->localeCallbacks->localeToLowerCase) {
RootedValue result(cx);
if (!cx->runtime()->localeCallbacks->localeToLowerCase(cx, str, &result)) {
return false;
}
args.rval().set(result);
return true;
}
RootedLinearString linear(cx, str->ensureLinear(cx));
if (!linear) {
return false;
}
JSString* result = StringToLowerCase(cx, linear);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
#endif
static inline bool ToUpperCaseHasSpecialCasing(Latin1Char charCode) {
bool hasUpperCaseSpecialCasing =
charCode == unicode::LATIN_SMALL_LETTER_SHARP_S;
MOZ_ASSERT(hasUpperCaseSpecialCasing ==
unicode::ChangesWhenUpperCasedSpecialCasing(charCode));
return hasUpperCaseSpecialCasing;
}
static inline bool ToUpperCaseHasSpecialCasing(char16_t charCode) {
return unicode::ChangesWhenUpperCasedSpecialCasing(charCode);
}
static inline size_t ToUpperCaseLengthSpecialCasing(Latin1Char charCode) {
MOZ_ASSERT(charCode == unicode::LATIN_SMALL_LETTER_SHARP_S);
return 2;
}
static inline size_t ToUpperCaseLengthSpecialCasing(char16_t charCode) {
MOZ_ASSERT(ToUpperCaseHasSpecialCasing(charCode));
return unicode::LengthUpperCaseSpecialCasing(charCode);
}
static inline void ToUpperCaseAppendUpperCaseSpecialCasing(char16_t charCode,
Latin1Char* elements,
size_t* index) {
MOZ_ASSERT(charCode == unicode::LATIN_SMALL_LETTER_SHARP_S);
static_assert('S' <= JSString::MAX_LATIN1_CHAR, "'S' is a Latin-1 character");
elements[(*index)++] = 'S';
elements[(*index)++] = 'S';
}
static inline void ToUpperCaseAppendUpperCaseSpecialCasing(char16_t charCode,
char16_t* elements,
size_t* index) {
unicode::AppendUpperCaseSpecialCasing(charCode, elements, index);
}
template <typename DestChar, typename SrcChar>
static size_t ToUpperCaseImpl(DestChar* destChars, const SrcChar* srcChars,
size_t startIndex, size_t srcLength,
size_t destLength) {
static_assert(IsSame<SrcChar, Latin1Char>::value ||
!IsSame<DestChar, Latin1Char>::value,
"cannot write non-Latin-1 characters into Latin-1 string");
MOZ_ASSERT(startIndex < srcLength);
MOZ_ASSERT(srcLength <= destLength);
size_t j = startIndex;
for (size_t i = startIndex; i < srcLength; i++) {
char16_t c = srcChars[i];
if (!IsSame<DestChar, Latin1Char>::value) {
if (unicode::IsLeadSurrogate(c) && i + 1 < srcLength) {
char16_t trail = srcChars[i + 1];
if (unicode::IsTrailSurrogate(trail)) {
trail = unicode::ToUpperCaseNonBMPTrail(c, trail);
destChars[j++] = c;
destChars[j++] = trail;
i++;
continue;
}
}
}
if (MOZ_UNLIKELY(c > 0x7f &&
ToUpperCaseHasSpecialCasing(static_cast<SrcChar>(c)))) {
if (srcLength == destLength) {
return i;
}
ToUpperCaseAppendUpperCaseSpecialCasing(c, destChars, &j);
continue;
}
c = unicode::ToUpperCase(c);
MOZ_ASSERT_IF((IsSame<DestChar, Latin1Char>::value),
c <= JSString::MAX_LATIN1_CHAR);
destChars[j++] = c;
}
MOZ_ASSERT(j == destLength);
return srcLength;
}
static bool ToUpperCaseImpl(Latin1Char* destChars, const char16_t* srcChars,
size_t startIndex, size_t srcLength,
size_t destLength) {
MOZ_ASSERT_UNREACHABLE(
"cannot write non-Latin-1 characters into Latin-1 string");
return false;
}
template <typename CharT>
static size_t ToUpperCaseLength(const CharT* chars, size_t startIndex,
size_t length) {
size_t upperLength = length;
for (size_t i = startIndex; i < length; i++) {
char16_t c = chars[i];
if (c > 0x7f && ToUpperCaseHasSpecialCasing(static_cast<CharT>(c))) {
upperLength += ToUpperCaseLengthSpecialCasing(static_cast<CharT>(c)) - 1;
}
}
return upperLength;
}
template <typename DestChar, typename SrcChar>
static inline void CopyChars(DestChar* destChars, const SrcChar* srcChars,
size_t length) {
static_assert(!IsSame<DestChar, SrcChar>::value,
"PodCopy is used for the same type case");
for (size_t i = 0; i < length; i++) {
destChars[i] = srcChars[i];
}
}
template <typename CharT>
static inline void CopyChars(CharT* destChars, const CharT* srcChars,
size_t length) {
PodCopy(destChars, srcChars, length);
}
template <typename DestChar, typename SrcChar>
static inline bool ToUpperCase(JSContext* cx,
InlineCharBuffer<DestChar>& newChars,
const SrcChar* chars, size_t startIndex,
size_t length, size_t* resultLength) {
MOZ_ASSERT(startIndex < length);
*resultLength = length;
if (!newChars.maybeAlloc(cx, length)) {
return false;
}
CopyChars(newChars.get(), chars, startIndex);
size_t readChars =
ToUpperCaseImpl(newChars.get(), chars, startIndex, length, length);
if (readChars < length) {
size_t actualLength = ToUpperCaseLength(chars, readChars, length);
*resultLength = actualLength;
if (!newChars.maybeRealloc(cx, length, actualLength)) {
return false;
}
MOZ_ALWAYS_TRUE(length == ToUpperCaseImpl(newChars.get(), chars, readChars,
length, actualLength));
}
return true;
}
template <typename CharT>
static JSString* ToUpperCase(JSContext* cx, JSLinearString* str) {
using Latin1Buffer = InlineCharBuffer<Latin1Char>;
using TwoByteBuffer = InlineCharBuffer<char16_t>;
mozilla::MaybeOneOf<Latin1Buffer, TwoByteBuffer> newChars;
const size_t length = str->length();
size_t resultLength;
{
AutoCheckCannotGC nogc;
const CharT* chars = str->chars<CharT>(nogc);
if (IsSame<CharT, Latin1Char>::value) {
if (length == 1) {
Latin1Char c = chars[0];
if (c != unicode::MICRO_SIGN &&
c != unicode::LATIN_SMALL_LETTER_Y_WITH_DIAERESIS &&
c != unicode::LATIN_SMALL_LETTER_SHARP_S) {
char16_t upper = unicode::ToUpperCase(c);
MOZ_ASSERT(upper <= JSString::MAX_LATIN1_CHAR);
MOZ_ASSERT(StaticStrings::hasUnit(upper));
return cx->staticStrings().getUnit(upper);
}
MOZ_ASSERT(unicode::ToUpperCase(c) > JSString::MAX_LATIN1_CHAR ||
ToUpperCaseHasSpecialCasing(c));
}
}
size_t i = 0;
for (; i < length; i++) {
CharT c = chars[i];
if (!IsSame<CharT, Latin1Char>::value) {
if (unicode::IsLeadSurrogate(c) && i + 1 < length) {
CharT trail = chars[i + 1];
if (unicode::IsTrailSurrogate(trail)) {
if (unicode::ChangesWhenUpperCasedNonBMP(c, trail)) {
break;
}
i++;
continue;
}
}
}
if (unicode::ChangesWhenUpperCased(c)) {
break;
}
if (MOZ_UNLIKELY(c > 0x7f && ToUpperCaseHasSpecialCasing(c))) {
break;
}
}
if (i == length) {
return str;
}
bool resultIsLatin1;
if (IsSame<CharT, Latin1Char>::value) {
resultIsLatin1 = true;
for (size_t j = i; j < length; j++) {
Latin1Char c = chars[j];
if (c == unicode::MICRO_SIGN ||
c == unicode::LATIN_SMALL_LETTER_Y_WITH_DIAERESIS) {
MOZ_ASSERT(unicode::ToUpperCase(c) > JSString::MAX_LATIN1_CHAR);
resultIsLatin1 = false;
break;
} else {
MOZ_ASSERT(unicode::ToUpperCase(c) <= JSString::MAX_LATIN1_CHAR);
}
}
} else {
resultIsLatin1 = false;
}
if (resultIsLatin1) {
newChars.construct<Latin1Buffer>();
if (!ToUpperCase(cx, newChars.ref<Latin1Buffer>(), chars, i, length,
&resultLength)) {
return nullptr;
}
} else {
newChars.construct<TwoByteBuffer>();
if (!ToUpperCase(cx, newChars.ref<TwoByteBuffer>(), chars, i, length,
&resultLength)) {
return nullptr;
}
}
}
return newChars.constructed<Latin1Buffer>()
? newChars.ref<Latin1Buffer>().toStringDontDeflate(cx,
resultLength)
: newChars.ref<TwoByteBuffer>().toStringDontDeflate(cx,
resultLength);
}
JSString* js::StringToUpperCase(JSContext* cx, HandleString string) {
JSLinearString* linear = string->ensureLinear(cx);
if (!linear) {
return nullptr;
}
if (linear->hasLatin1Chars()) {
return ToUpperCase<Latin1Char>(cx, linear);
}
return ToUpperCase<char16_t>(cx, linear);
}
bool js::str_toUpperCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
JSString* result = StringToUpperCase(cx, str);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
bool js::intl_toLocaleUpperCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
MOZ_ASSERT(args.length() == 2);
MOZ_ASSERT(args[0].isString());
MOZ_ASSERT(args[1].isString());
RootedString string(cx, args[0].toString());
const char* locale = CaseMappingLocale(cx, args[1].toString());
if (!locale) {
return false;
}
if (intl::StringsAreEqual(locale, "")) {
JSString* str = js::StringToUpperCase(cx, string);
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
AutoStableStringChars inputChars(cx);
if (!inputChars.initTwoByte(cx, string)) {
return false;
}
mozilla::Range<const char16_t> input = inputChars.twoByteRange();
static_assert(JSString::MAX_LENGTH <= INT32_MAX,
"String length must fit in int32_t for ICU");
static const size_t INLINE_CAPACITY = js::intl::INITIAL_CHAR_BUFFER_SIZE;
Vector<char16_t, INLINE_CAPACITY> chars(cx);
if (!chars.resize(Max(INLINE_CAPACITY, input.length()))) {
return false;
}
int32_t size = intl::CallICU(
cx,
[&input, locale](UChar* chars, int32_t size, UErrorCode* status) {
return u_strToUpper(chars, size, input.begin().get(), input.length(),
locale, status);
},
chars);
if (size < 0) {
return false;
}
JSString* result = NewStringCopyN<CanGC>(cx, chars.begin(), size);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
#if EXPOSE_INTL_API
#else
bool js::str_toLocaleUpperCase(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
if (cx->runtime()->localeCallbacks &&
cx->runtime()->localeCallbacks->localeToUpperCase) {
RootedValue result(cx);
if (!cx->runtime()->localeCallbacks->localeToUpperCase(cx, str, &result)) {
return false;
}
args.rval().set(result);
return true;
}
RootedLinearString linear(cx, str->ensureLinear(cx));
if (!linear) {
return false;
}
JSString* result = StringToUpperCase(cx, linear);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
#endif
#if EXPOSE_INTL_API
#else
bool js::str_localeCompare(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
RootedString thatStr(cx, ToString<CanGC>(cx, args.get(0)));
if (!thatStr) {
return false;
}
if (cx->runtime()->localeCallbacks &&
cx->runtime()->localeCallbacks->localeCompare) {
RootedValue result(cx);
if (!cx->runtime()->localeCallbacks->localeCompare(cx, str, thatStr,
&result)) {
return false;
}
args.rval().set(result);
return true;
}
int32_t result;
if (!CompareStrings(cx, str, thatStr, &result)) {
return false;
}
args.rval().setInt32(result);
return true;
}
#endif
#if EXPOSE_INTL_API
bool js::str_normalize(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
enum NormalizationForm { NFC, NFD, NFKC, NFKD };
NormalizationForm form;
if (!args.hasDefined(0)) {
form = NFC;
} else {
JSLinearString* formStr = ArgToLinearString(cx, args, 0);
if (!formStr) {
return false;
}
if (EqualStrings(formStr, cx->names().NFC)) {
form = NFC;
} else if (EqualStrings(formStr, cx->names().NFD)) {
form = NFD;
} else if (EqualStrings(formStr, cx->names().NFKC)) {
form = NFKC;
} else if (EqualStrings(formStr, cx->names().NFKD)) {
form = NFKD;
} else {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_INVALID_NORMALIZE_FORM);
return false;
}
}
if (form == NFC && str->hasLatin1Chars()) {
args.rval().setString(str);
return true;
}
AutoStableStringChars stableChars(cx);
if (!stableChars.initTwoByte(cx, str)) {
return false;
}
mozilla::Range<const char16_t> srcChars = stableChars.twoByteRange();
UErrorCode status = U_ZERO_ERROR;
const UNormalizer2* normalizer;
if (form == NFC) {
normalizer = unorm2_getNFCInstance(&status);
} else if (form == NFD) {
normalizer = unorm2_getNFDInstance(&status);
} else if (form == NFKC) {
normalizer = unorm2_getNFKCInstance(&status);
} else {
MOZ_ASSERT(form == NFKD);
normalizer = unorm2_getNFKDInstance(&status);
}
if (U_FAILURE(status)) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_INTERNAL_INTL_ERROR);
return false;
}
int32_t spanLengthInt = unorm2_spanQuickCheckYes(
normalizer, srcChars.begin().get(), srcChars.length(), &status);
if (U_FAILURE(status)) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_INTERNAL_INTL_ERROR);
return false;
}
MOZ_ASSERT(0 <= spanLengthInt && size_t(spanLengthInt) <= srcChars.length());
size_t spanLength = size_t(spanLengthInt);
if (spanLength == srcChars.length()) {
args.rval().setString(str);
return true;
}
static const size_t INLINE_CAPACITY = js::intl::INITIAL_CHAR_BUFFER_SIZE;
Vector<char16_t, INLINE_CAPACITY> chars(cx);
if (!chars.resize(Max(INLINE_CAPACITY, srcChars.length()))) {
return false;
}
if (spanLength > 0) {
PodCopy(chars.begin(), srcChars.begin().get(), spanLength);
}
int32_t size =
intl::CallICU(cx,
[normalizer, &srcChars, spanLength](
UChar* chars, uint32_t size, UErrorCode* status) {
mozilla::RangedPtr<const char16_t> remainingStart =
srcChars.begin() + spanLength;
size_t remainingLength = srcChars.length() - spanLength;
return unorm2_normalizeSecondAndAppend(
normalizer, chars, spanLength, size,
remainingStart.get(), remainingLength, status);
},
chars);
if (size < 0) {
return false;
}
JSString* ns = NewStringCopyN<CanGC>(cx, chars.begin(), size);
if (!ns) {
return false;
}
args.rval().setString(ns);
return true;
}
#endif
bool js::str_charAt(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx);
size_t i;
if (args.thisv().isString() && args.length() != 0 && args[0].isInt32()) {
str = args.thisv().toString();
i = size_t(args[0].toInt32());
if (i >= str->length()) {
goto out_of_range;
}
} else {
str = ToStringForStringFunction(cx, args.thisv());
if (!str) {
return false;
}
double d = 0.0;
if (args.length() > 0 && !ToInteger(cx, args[0], &d)) {
return false;
}
if (d < 0 || str->length() <= d) {
goto out_of_range;
}
i = size_t(d);
}
str = cx->staticStrings().getUnitStringForElement(cx, str, i);
if (!str) {
return false;
}
args.rval().setString(str);
return true;
out_of_range:
args.rval().setString(cx->runtime()->emptyString);
return true;
}
bool js::str_charCodeAt_impl(JSContext* cx, HandleString string,
HandleValue index, MutableHandleValue res) {
size_t i;
if (index.isInt32()) {
i = index.toInt32();
if (i >= string->length()) {
goto out_of_range;
}
} else {
double d = 0.0;
if (!ToInteger(cx, index, &d)) {
return false;
}
if (d < 0 || string->length() <= d) {
goto out_of_range;
}
i = size_t(d);
}
char16_t c;
if (!string->getChar(cx, i, &c)) {
return false;
}
res.setInt32(c);
return true;
out_of_range:
res.setNaN();
return true;
}
bool js::str_charCodeAt(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx);
RootedValue index(cx);
if (args.thisv().isString()) {
str = args.thisv().toString();
} else {
str = ToStringForStringFunction(cx, args.thisv());
if (!str) {
return false;
}
}
if (args.length() != 0) {
index = args[0];
} else {
index.setInt32(0);
}
return js::str_charCodeAt_impl(cx, str, index, args.rval());
}
static const uint32_t sBMHCharSetSize = 256;
static const uint32_t sBMHPatLenMax = 255;
static const int sBMHBadPattern =
-2;
template <typename TextChar, typename PatChar>
static int BoyerMooreHorspool(const TextChar* text, uint32_t textLen,
const PatChar* pat, uint32_t patLen) {
MOZ_ASSERT(0 < patLen && patLen <= sBMHPatLenMax);
uint8_t skip[sBMHCharSetSize];
for (uint32_t i = 0; i < sBMHCharSetSize; i++) {
skip[i] = uint8_t(patLen);
}
uint32_t patLast = patLen - 1;
for (uint32_t i = 0; i < patLast; i++) {
char16_t c = pat[i];
if (c >= sBMHCharSetSize) {
return sBMHBadPattern;
}
skip[c] = uint8_t(patLast - i);
}
for (uint32_t k = patLast; k < textLen;) {
for (uint32_t i = k, j = patLast;; i--, j--) {
if (text[i] != pat[j]) {
break;
}
if (j == 0) {
return static_cast<int>(i);
}
}
char16_t c = text[k];
k += (c >= sBMHCharSetSize) ? patLen : skip[c];
}
return -1;
}
template <typename TextChar, typename PatChar>
struct MemCmp {
typedef uint32_t Extent;
static MOZ_ALWAYS_INLINE Extent computeExtent(const PatChar*,
uint32_t patLen) {
return (patLen - 1) * sizeof(PatChar);
}
static MOZ_ALWAYS_INLINE bool match(const PatChar* p, const TextChar* t,
Extent extent) {
MOZ_ASSERT(sizeof(TextChar) == sizeof(PatChar));
return memcmp(p, t, extent) == 0;
}
};
template <typename TextChar, typename PatChar>
struct ManualCmp {
typedef const PatChar* Extent;
static MOZ_ALWAYS_INLINE Extent computeExtent(const PatChar* pat,
uint32_t patLen) {
return pat + patLen;
}
static MOZ_ALWAYS_INLINE bool match(const PatChar* p, const TextChar* t,
Extent extent) {
for (; p != extent; ++p, ++t) {
if (*p != *t) {
return false;
}
}
return true;
}
};
template <typename TextChar, typename PatChar>
static const TextChar* FirstCharMatcherUnrolled(const TextChar* text,
uint32_t n, const PatChar pat) {
const TextChar* textend = text + n;
const TextChar* t = text;
switch ((textend - t) & 7) {
case 0:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 7:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 6:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 5:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 4:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 3:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 2:
if (*t++ == pat) return t - 1;
MOZ_FALLTHROUGH;
case 1:
if (*t++ == pat) return t - 1;
}
while (textend != t) {
if (t[0] == pat) return t;
if (t[1] == pat) return t + 1;
if (t[2] == pat) return t + 2;
if (t[3] == pat) return t + 3;
if (t[4] == pat) return t + 4;
if (t[5] == pat) return t + 5;
if (t[6] == pat) return t + 6;
if (t[7] == pat) return t + 7;
t += 8;
}
return nullptr;
}
static const char* FirstCharMatcher8bit(const char* text, uint32_t n,
const char pat) {
return reinterpret_cast<const char*>(memchr(text, pat, n));
}
template <class InnerMatch, typename TextChar, typename PatChar>
static int Matcher(const TextChar* text, uint32_t textlen, const PatChar* pat,
uint32_t patlen) {
MOZ_ASSERT(patlen > 0);
if (sizeof(TextChar) == 1 && sizeof(PatChar) > 1 && pat[0] > 0xff) {
return -1;
}
const typename InnerMatch::Extent extent =
InnerMatch::computeExtent(pat, patlen);
uint32_t i = 0;
uint32_t n = textlen - patlen + 1;
while (i < n) {
const TextChar* pos;
if (sizeof(TextChar) == 1) {
MOZ_ASSERT(pat[0] <= 0xff);
pos = (TextChar*)FirstCharMatcher8bit((char*)text + i, n - i, pat[0]);
} else {
pos = FirstCharMatcherUnrolled(text + i, n - i, char16_t(pat[0]));
}
if (pos == nullptr) {
return -1;
}
i = static_cast<uint32_t>(pos - text);
if (InnerMatch::match(pat + 1, text + i + 1, extent)) {
return i;
}
i += 1;
}
return -1;
}
template <typename TextChar, typename PatChar>
static MOZ_ALWAYS_INLINE int StringMatch(const TextChar* text, uint32_t textLen,
const PatChar* pat, uint32_t patLen) {
if (patLen == 0) {
return 0;
}
if (textLen < patLen) {
return -1;
}
#if defined(__i386__) || defined(_M_IX86) || defined(__i386)
if (patLen == 1) {
const PatChar p0 = *pat;
const TextChar* end = text + textLen;
for (const TextChar* c = text; c != end; ++c) {
if (*c == p0) {
return c - text;
}
}
return -1;
}
#endif
if (textLen >= 512 && patLen >= 11 && patLen <= sBMHPatLenMax) {
int index = BoyerMooreHorspool(text, textLen, pat, patLen);
if (index != sBMHBadPattern) {
return index;
}
}
return (patLen > 128 && IsSame<TextChar, PatChar>::value)
? Matcher<MemCmp<TextChar, PatChar>, TextChar, PatChar>(
text, textLen, pat, patLen)
: Matcher<ManualCmp<TextChar, PatChar>, TextChar, PatChar>(
text, textLen, pat, patLen);
}
static int32_t StringMatch(JSLinearString* text, JSLinearString* pat,
uint32_t start = 0) {
MOZ_ASSERT(start <= text->length());
uint32_t textLen = text->length() - start;
uint32_t patLen = pat->length();
int match;
AutoCheckCannotGC nogc;
if (text->hasLatin1Chars()) {
const Latin1Char* textChars = text->latin1Chars(nogc) + start;
if (pat->hasLatin1Chars()) {
match = StringMatch(textChars, textLen, pat->latin1Chars(nogc), patLen);
} else {
match = StringMatch(textChars, textLen, pat->twoByteChars(nogc), patLen);
}
} else {
const char16_t* textChars = text->twoByteChars(nogc) + start;
if (pat->hasLatin1Chars()) {
match = StringMatch(textChars, textLen, pat->latin1Chars(nogc), patLen);
} else {
match = StringMatch(textChars, textLen, pat->twoByteChars(nogc), patLen);
}
}
return (match == -1) ? -1 : start + match;
}
static const size_t sRopeMatchThresholdRatioLog2 = 4;
int js::StringFindPattern(JSLinearString* text, JSLinearString* pat,
size_t start) {
return StringMatch(text, pat, start);
}
class StringSegmentRange {
using StackVector = JS::GCVector<JSString*, 16>;
Rooted<StackVector> stack;
RootedLinearString cur;
bool settle(JSString* str) {
while (str->isRope()) {
JSRope& rope = str->asRope();
if (!stack.append(rope.rightChild())) {
return false;
}
str = rope.leftChild();
}
cur = &str->asLinear();
return true;
}
public:
explicit StringSegmentRange(JSContext* cx)
: stack(cx, StackVector(cx)), cur(cx) {}
MOZ_MUST_USE bool init(JSString* str) {
MOZ_ASSERT(stack.empty());
return settle(str);
}
bool empty() const { return cur == nullptr; }
JSLinearString* front() const {
MOZ_ASSERT(!cur->isRope());
return cur;
}
MOZ_MUST_USE bool popFront() {
MOZ_ASSERT(!empty());
if (stack.empty()) {
cur = nullptr;
return true;
}
return settle(stack.popCopy());
}
};
typedef Vector<JSLinearString*, 16, SystemAllocPolicy> LinearStringVector;
template <typename TextChar, typename PatChar>
static int RopeMatchImpl(const AutoCheckCannotGC& nogc,
LinearStringVector& strings, const PatChar* pat,
size_t patLen) {
int pos = 0;
for (JSLinearString** outerp = strings.begin(); outerp != strings.end();
++outerp) {
JSLinearString* outer = *outerp;
const TextChar* chars = outer->chars<TextChar>(nogc);
size_t len = outer->length();
int matchResult = StringMatch(chars, len, pat, patLen);
if (matchResult != -1) {
return pos + matchResult;
}
const TextChar* const text = chars + (patLen > len ? 0 : len - patLen + 1);
const TextChar* const textend = chars + len;
const PatChar p0 = *pat;
const PatChar* const p1 = pat + 1;
const PatChar* const patend = pat + patLen;
for (const TextChar* t = text; t != textend;) {
if (*t++ != p0) {
continue;
}
JSLinearString** innerp = outerp;
const TextChar* ttend = textend;
const TextChar* tt = t;
for (const PatChar* pp = p1; pp != patend; ++pp, ++tt) {
while (tt == ttend) {
if (++innerp == strings.end()) {
return -1;
}
JSLinearString* inner = *innerp;
tt = inner->chars<TextChar>(nogc);
ttend = tt + inner->length();
}
if (*pp != *tt) {
goto break_continue;
}
}
return pos + (t - chars) - 1;
break_continue:;
}
pos += len;
}
return -1;
}
static bool RopeMatch(JSContext* cx, JSRope* text, JSLinearString* pat,
int* match) {
uint32_t patLen = pat->length();
if (patLen == 0) {
*match = 0;
return true;
}
if (text->length() < patLen) {
*match = -1;
return true;
}
LinearStringVector strings;
{
size_t threshold = text->length() >> sRopeMatchThresholdRatioLog2;
StringSegmentRange r(cx);
if (!r.init(text)) {
return false;
}
bool textIsLatin1 = text->hasLatin1Chars();
while (!r.empty()) {
if (threshold-- == 0 || r.front()->hasLatin1Chars() != textIsLatin1 ||
!strings.append(r.front())) {
JSLinearString* linear = text->ensureLinear(cx);
if (!linear) {
return false;
}
*match = StringMatch(linear, pat);
return true;
}
if (!r.popFront()) {
return false;
}
}
}
AutoCheckCannotGC nogc;
if (text->hasLatin1Chars()) {
if (pat->hasLatin1Chars()) {
*match = RopeMatchImpl<Latin1Char>(nogc, strings, pat->latin1Chars(nogc),
patLen);
} else {
*match = RopeMatchImpl<Latin1Char>(nogc, strings, pat->twoByteChars(nogc),
patLen);
}
} else {
if (pat->hasLatin1Chars()) {
*match = RopeMatchImpl<char16_t>(nogc, strings, pat->latin1Chars(nogc),
patLen);
} else {
*match = RopeMatchImpl<char16_t>(nogc, strings, pat->twoByteChars(nogc),
patLen);
}
}
return true;
}
static MOZ_ALWAYS_INLINE bool ReportErrorIfFirstArgIsRegExp(
JSContext* cx, const CallArgs& args) {
if (args.length() == 0 || !args[0].isObject()) {
return true;
}
bool isRegExp;
if (!IsRegExp(cx, args[0], &isRegExp)) {
return false;
}
if (isRegExp) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_INVALID_ARG_TYPE, "first", "",
"Regular Expression");
return false;
}
return true;
}
bool js::str_includes(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
if (!ReportErrorIfFirstArgIsRegExp(cx, args)) {
return false;
}
RootedLinearString searchStr(cx, ArgToLinearString(cx, args, 0));
if (!searchStr) {
return false;
}
uint32_t pos = 0;
if (args.hasDefined(1)) {
if (args[1].isInt32()) {
int i = args[1].toInt32();
pos = (i < 0) ? 0U : uint32_t(i);
} else {
double d;
if (!ToInteger(cx, args[1], &d)) {
return false;
}
pos = uint32_t(Min(Max(d, 0.0), double(UINT32_MAX)));
}
}
uint32_t textLen = str->length();
uint32_t start = Min(Max(pos, 0U), textLen);
JSLinearString* text = str->ensureLinear(cx);
if (!text) {
return false;
}
args.rval().setBoolean(StringMatch(text, searchStr, start) != -1);
return true;
}
bool js::str_indexOf(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
RootedLinearString searchStr(cx, ArgToLinearString(cx, args, 0));
if (!searchStr) {
return false;
}
uint32_t pos = 0;
if (args.hasDefined(1)) {
if (args[1].isInt32()) {
int i = args[1].toInt32();
pos = (i < 0) ? 0U : uint32_t(i);
} else {
double d;
if (!ToInteger(cx, args[1], &d)) {
return false;
}
pos = uint32_t(Min(Max(d, 0.0), double(UINT32_MAX)));
}
}
uint32_t textLen = str->length();
uint32_t start = Min(Max(pos, 0U), textLen);
if (str == searchStr) {
args.rval().setInt32(start == 0 ? 0 : -1);
return true;
}
JSLinearString* text = str->ensureLinear(cx);
if (!text) {
return false;
}
args.rval().setInt32(StringMatch(text, searchStr, start));
return true;
}
template <typename TextChar, typename PatChar>
static int32_t LastIndexOfImpl(const TextChar* text, size_t textLen,
const PatChar* pat, size_t patLen,
size_t start) {
MOZ_ASSERT(patLen > 0);
MOZ_ASSERT(patLen <= textLen);
MOZ_ASSERT(start <= textLen - patLen);
const PatChar p0 = *pat;
const PatChar* patNext = pat + 1;
const PatChar* patEnd = pat + patLen;
for (const TextChar* t = text + start; t >= text; --t) {
if (*t == p0) {
const TextChar* t1 = t + 1;
for (const PatChar* p1 = patNext; p1 < patEnd; ++p1, ++t1) {
if (*t1 != *p1) {
goto break_continue;
}
}
return static_cast<int32_t>(t - text);
}
break_continue:;
}
return -1;
}
bool js::str_lastIndexOf(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
RootedLinearString searchStr(cx, ArgToLinearString(cx, args, 0));
if (!searchStr) {
return false;
}
size_t len = str->length();
size_t searchLen = searchStr->length();
int start = len - searchLen; if (args.hasDefined(1)) {
if (args[1].isInt32()) {
int i = args[1].toInt32();
if (i <= 0) {
start = 0;
} else if (i < start) {
start = i;
}
} else {
double d;
if (!ToNumber(cx, args[1], &d)) {
return false;
}
if (!IsNaN(d)) {
d = JS::ToInteger(d);
if (d <= 0) {
start = 0;
} else if (d < start) {
start = int(d);
}
}
}
}
if (str == searchStr) {
args.rval().setInt32(0);
return true;
}
if (searchLen > len) {
args.rval().setInt32(-1);
return true;
}
if (searchLen == 0) {
args.rval().setInt32(start);
return true;
}
MOZ_ASSERT(0 <= start && size_t(start) < len);
JSLinearString* text = str->ensureLinear(cx);
if (!text) {
return false;
}
int32_t res;
AutoCheckCannotGC nogc;
if (text->hasLatin1Chars()) {
const Latin1Char* textChars = text->latin1Chars(nogc);
if (searchStr->hasLatin1Chars()) {
res = LastIndexOfImpl(textChars, len, searchStr->latin1Chars(nogc),
searchLen, start);
} else {
res = LastIndexOfImpl(textChars, len, searchStr->twoByteChars(nogc),
searchLen, start);
}
} else {
const char16_t* textChars = text->twoByteChars(nogc);
if (searchStr->hasLatin1Chars()) {
res = LastIndexOfImpl(textChars, len, searchStr->latin1Chars(nogc),
searchLen, start);
} else {
res = LastIndexOfImpl(textChars, len, searchStr->twoByteChars(nogc),
searchLen, start);
}
}
args.rval().setInt32(res);
return true;
}
bool js::str_startsWith(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
if (!ReportErrorIfFirstArgIsRegExp(cx, args)) {
return false;
}
RootedLinearString searchStr(cx, ArgToLinearString(cx, args, 0));
if (!searchStr) {
return false;
}
uint32_t pos = 0;
if (args.hasDefined(1)) {
if (args[1].isInt32()) {
int i = args[1].toInt32();
pos = (i < 0) ? 0U : uint32_t(i);
} else {
double d;
if (!ToInteger(cx, args[1], &d)) {
return false;
}
pos = uint32_t(Min(Max(d, 0.0), double(UINT32_MAX)));
}
}
uint32_t textLen = str->length();
uint32_t start = Min(Max(pos, 0U), textLen);
uint32_t searchLen = searchStr->length();
if (searchLen + start < searchLen || searchLen + start > textLen) {
args.rval().setBoolean(false);
return true;
}
JSLinearString* text = str->ensureLinear(cx);
if (!text) {
return false;
}
args.rval().setBoolean(HasSubstringAt(text, searchStr, start));
return true;
}
bool js::str_endsWith(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx, ToStringForStringFunction(cx, args.thisv()));
if (!str) {
return false;
}
if (!ReportErrorIfFirstArgIsRegExp(cx, args)) {
return false;
}
RootedLinearString searchStr(cx, ArgToLinearString(cx, args, 0));
if (!searchStr) {
return false;
}
uint32_t textLen = str->length();
uint32_t pos = textLen;
if (args.hasDefined(1)) {
if (args[1].isInt32()) {
int i = args[1].toInt32();
pos = (i < 0) ? 0U : uint32_t(i);
} else {
double d;
if (!ToInteger(cx, args[1], &d)) {
return false;
}
pos = uint32_t(Min(Max(d, 0.0), double(UINT32_MAX)));
}
}
uint32_t end = Min(Max(pos, 0U), textLen);
uint32_t searchLen = searchStr->length();
if (searchLen > end) {
args.rval().setBoolean(false);
return true;
}
uint32_t start = end - searchLen;
JSLinearString* text = str->ensureLinear(cx);
if (!text) {
return false;
}
args.rval().setBoolean(HasSubstringAt(text, searchStr, start));
return true;
}
template <typename CharT>
static void TrimString(const CharT* chars, bool trimStart, bool trimEnd,
size_t length, size_t* pBegin, size_t* pEnd) {
size_t begin = 0, end = length;
if (trimStart) {
while (begin < length && unicode::IsSpace(chars[begin])) {
++begin;
}
}
if (trimEnd) {
while (end > begin && unicode::IsSpace(chars[end - 1])) {
--end;
}
}
*pBegin = begin;
*pEnd = end;
}
static bool TrimString(JSContext* cx, const CallArgs& args, bool trimStart,
bool trimEnd) {
JSString* str = ToStringForStringFunction(cx, args.thisv());
if (!str) {
return false;
}
JSLinearString* linear = str->ensureLinear(cx);
if (!linear) {
return false;
}
size_t length = linear->length();
size_t begin, end;
if (linear->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
TrimString(linear->latin1Chars(nogc), trimStart, trimEnd, length, &begin,
&end);
} else {
AutoCheckCannotGC nogc;
TrimString(linear->twoByteChars(nogc), trimStart, trimEnd, length, &begin,
&end);
}
JSLinearString* result = NewDependentString(cx, linear, begin, end - begin);
if (!result) {
return false;
}
args.rval().setString(result);
return true;
}
bool js::str_trim(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
return TrimString(cx, args, true, true);
}
bool js::str_trimStart(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
return TrimString(cx, args, true, false);
}
bool js::str_trimEnd(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
return TrimString(cx, args, false, true);
}
class RopeBuilder {
JSContext* cx;
RootedString res;
RopeBuilder(const RopeBuilder& other) = delete;
void operator=(const RopeBuilder& other) = delete;
public:
explicit RopeBuilder(JSContext* cx)
: cx(cx), res(cx, cx->runtime()->emptyString) {}
inline bool append(HandleString str) {
res = ConcatStrings<CanGC>(cx, res, str);
return !!res;
}
inline JSString* result() { return res; }
};
namespace {
template <typename CharT>
static uint32_t FindDollarIndex(const CharT* chars, size_t length) {
if (const CharT* p = js_strchr_limit(chars, '$', chars + length)) {
uint32_t dollarIndex = p - chars;
MOZ_ASSERT(dollarIndex < length);
return dollarIndex;
}
return UINT32_MAX;
}
}
static JSString* BuildFlatReplacement(JSContext* cx, HandleString textstr,
HandleLinearString repstr,
size_t matchStart, size_t patternLength) {
size_t matchEnd = matchStart + patternLength;
RootedString resultStr(cx, NewDependentString(cx, textstr, 0, matchStart));
if (!resultStr) {
return nullptr;
}
resultStr = ConcatStrings<CanGC>(cx, resultStr, repstr);
if (!resultStr) {
return nullptr;
}
MOZ_ASSERT(textstr->length() >= matchEnd);
RootedString rest(cx, NewDependentString(cx, textstr, matchEnd,
textstr->length() - matchEnd));
if (!rest) {
return nullptr;
}
return ConcatStrings<CanGC>(cx, resultStr, rest);
}
static JSString* BuildFlatRopeReplacement(JSContext* cx, HandleString textstr,
HandleLinearString repstr,
size_t match, size_t patternLength) {
MOZ_ASSERT(textstr->isRope());
size_t matchEnd = match + patternLength;
StringSegmentRange r(cx);
if (!r.init(textstr)) {
return nullptr;
}
RopeBuilder builder(cx);
if (patternLength == 0) {
MOZ_ASSERT(match == 0);
if (!builder.append(repstr)) {
return nullptr;
}
}
size_t pos = 0;
while (!r.empty()) {
RootedString str(cx, r.front());
size_t len = str->length();
size_t strEnd = pos + len;
if (pos < matchEnd && strEnd > match) {
if (match >= pos) {
RootedString leftSide(cx, NewDependentString(cx, str, 0, match - pos));
if (!leftSide || !builder.append(leftSide) || !builder.append(repstr)) {
return nullptr;
}
}
if (strEnd > matchEnd) {
RootedString rightSide(
cx, NewDependentString(cx, str, matchEnd - pos, strEnd - matchEnd));
if (!rightSide || !builder.append(rightSide)) {
return nullptr;
}
}
} else {
if (!builder.append(str)) {
return nullptr;
}
}
pos += str->length();
if (!r.popFront()) {
return nullptr;
}
}
return builder.result();
}
template <typename CharT>
static bool AppendDollarReplacement(StringBuffer& newReplaceChars,
size_t firstDollarIndex, size_t matchStart,
size_t matchLimit, JSLinearString* text,
const CharT* repChars, size_t repLength) {
MOZ_ASSERT(firstDollarIndex < repLength);
newReplaceChars.infallibleAppend(repChars, firstDollarIndex);
const CharT* repLimit = repChars + repLength;
for (const CharT* it = repChars + firstDollarIndex; it < repLimit; ++it) {
if (*it != '$' || it == repLimit - 1) {
if (!newReplaceChars.append(*it)) {
return false;
}
continue;
}
switch (*(it + 1)) {
case '$':
if (!newReplaceChars.append(*it)) {
return false;
}
break;
case '&':
if (!newReplaceChars.appendSubstring(text, matchStart,
matchLimit - matchStart)) {
return false;
}
break;
case '`':
if (!newReplaceChars.appendSubstring(text, 0, matchStart)) {
return false;
}
break;
case '\'':
if (!newReplaceChars.appendSubstring(text, matchLimit,
text->length() - matchLimit)) {
return false;
}
break;
default:
if (!newReplaceChars.append(*it)) {
return false;
}
continue;
}
++it; }
return true;
}
static JSLinearString* InterpretDollarReplacement(
JSContext* cx, HandleString textstrArg, HandleLinearString repstr,
uint32_t firstDollarIndex, size_t matchStart, size_t patternLength) {
RootedLinearString textstr(cx, textstrArg->ensureLinear(cx));
if (!textstr) {
return nullptr;
}
size_t matchLimit = matchStart + patternLength;
StringBuffer newReplaceChars(cx);
if (repstr->hasTwoByteChars() && !newReplaceChars.ensureTwoByteChars()) {
return nullptr;
}
if (!newReplaceChars.reserve(textstr->length() - patternLength +
repstr->length())) {
return nullptr;
}
bool res;
if (repstr->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
res = AppendDollarReplacement(newReplaceChars, firstDollarIndex, matchStart,
matchLimit, textstr,
repstr->latin1Chars(nogc), repstr->length());
} else {
AutoCheckCannotGC nogc;
res = AppendDollarReplacement(newReplaceChars, firstDollarIndex, matchStart,
matchLimit, textstr,
repstr->twoByteChars(nogc), repstr->length());
}
if (!res) {
return nullptr;
}
return newReplaceChars.finishString();
}
template <typename StrChar, typename RepChar>
static bool StrFlatReplaceGlobal(JSContext* cx, JSLinearString* str,
JSLinearString* pat, JSLinearString* rep,
StringBuffer& sb) {
MOZ_ASSERT(str->length() > 0);
AutoCheckCannotGC nogc;
const StrChar* strChars = str->chars<StrChar>(nogc);
const RepChar* repChars = rep->chars<RepChar>(nogc);
if (!pat->length()) {
CheckedInt<uint32_t> strLength(str->length());
CheckedInt<uint32_t> repLength(rep->length());
CheckedInt<uint32_t> length = repLength * (strLength - 1) + strLength;
if (!length.isValid()) {
ReportAllocationOverflow(cx);
return false;
}
if (!sb.reserve(length.value())) {
return false;
}
for (unsigned i = 0; i < str->length() - 1; ++i, ++strChars) {
sb.infallibleAppend(*strChars);
sb.infallibleAppend(repChars, rep->length());
}
sb.infallibleAppend(*strChars);
return true;
}
if (rep->length() >= pat->length()) {
if (!sb.reserve(str->length())) {
return false;
}
}
uint32_t start = 0;
for (;;) {
int match = StringMatch(str, pat, start);
if (match < 0) {
break;
}
if (!sb.append(strChars + start, match - start)) {
return false;
}
if (!sb.append(repChars, rep->length())) {
return false;
}
start = match + pat->length();
}
if (!sb.append(strChars + start, str->length() - start)) {
return false;
}
return true;
}
JSString* js::StringFlatReplaceString(JSContext* cx, HandleString string,
HandleString pattern,
HandleString replacement) {
MOZ_ASSERT(string);
MOZ_ASSERT(pattern);
MOZ_ASSERT(replacement);
if (!string->length()) {
return string;
}
RootedLinearString linearRepl(cx, replacement->ensureLinear(cx));
if (!linearRepl) {
return nullptr;
}
RootedLinearString linearPat(cx, pattern->ensureLinear(cx));
if (!linearPat) {
return nullptr;
}
RootedLinearString linearStr(cx, string->ensureLinear(cx));
if (!linearStr) {
return nullptr;
}
StringBuffer sb(cx);
if (linearStr->hasTwoByteChars()) {
if (!sb.ensureTwoByteChars()) {
return nullptr;
}
if (linearRepl->hasTwoByteChars()) {
if (!StrFlatReplaceGlobal<char16_t, char16_t>(cx, linearStr, linearPat,
linearRepl, sb)) {
return nullptr;
}
} else {
if (!StrFlatReplaceGlobal<char16_t, Latin1Char>(cx, linearStr, linearPat,
linearRepl, sb)) {
return nullptr;
}
}
} else {
if (linearRepl->hasTwoByteChars()) {
if (!sb.ensureTwoByteChars()) {
return nullptr;
}
if (!StrFlatReplaceGlobal<Latin1Char, char16_t>(cx, linearStr, linearPat,
linearRepl, sb)) {
return nullptr;
}
} else {
if (!StrFlatReplaceGlobal<Latin1Char, Latin1Char>(
cx, linearStr, linearPat, linearRepl, sb)) {
return nullptr;
}
}
}
return sb.finishString();
}
JSString* js::str_replace_string_raw(JSContext* cx, HandleString string,
HandleString pattern,
HandleString replacement) {
RootedLinearString repl(cx, replacement->ensureLinear(cx));
if (!repl) {
return nullptr;
}
RootedLinearString pat(cx, pattern->ensureLinear(cx));
if (!pat) {
return nullptr;
}
size_t patternLength = pat->length();
int32_t match;
uint32_t dollarIndex;
{
AutoCheckCannotGC nogc;
dollarIndex =
repl->hasLatin1Chars()
? FindDollarIndex(repl->latin1Chars(nogc), repl->length())
: FindDollarIndex(repl->twoByteChars(nogc), repl->length());
}
if (string->isRope()) {
if (!RopeMatch(cx, &string->asRope(), pat, &match)) {
return nullptr;
}
} else {
match = StringMatch(&string->asLinear(), pat, 0);
}
if (match < 0) {
return string;
}
if (dollarIndex != UINT32_MAX) {
repl = InterpretDollarReplacement(cx, string, repl, dollarIndex, match,
patternLength);
if (!repl) {
return nullptr;
}
} else if (string->isRope()) {
return BuildFlatRopeReplacement(cx, string, repl, match, patternLength);
}
return BuildFlatReplacement(cx, string, repl, match, patternLength);
}
static ArrayObject* NewFullyAllocatedStringArray(JSContext* cx,
HandleObjectGroup group,
uint32_t length) {
ArrayObject* array = NewFullyAllocatedArrayTryUseGroup(cx, group, length);
if (!array) {
return nullptr;
}
MOZ_ASSERT(length > 0);
AddTypePropertyId(cx, array, JSID_VOID, TypeSet::StringType());
return array;
}
static ArrayObject* SingleElementStringArray(JSContext* cx,
HandleObjectGroup group,
HandleLinearString str) {
ArrayObject* array = NewFullyAllocatedStringArray(cx, group, 1);
if (!array) {
return nullptr;
}
array->setDenseInitializedLength(1);
array->initDenseElement(0, StringValue(str));
return array;
}
static ArrayObject* SplitHelper(JSContext* cx, HandleLinearString str,
uint32_t limit, HandleLinearString sep,
HandleObjectGroup group) {
size_t strLength = str->length();
size_t sepLength = sep->length();
MOZ_ASSERT(sepLength != 0);
if (strLength == 0) {
int match = StringMatch(str, sep, 0);
if (match != -1) {
return NewFullyAllocatedArrayTryUseGroup(cx, group, 0);
}
return SingleElementStringArray(cx, group, str);
}
AutoValueVector splits(cx);
size_t lastEndIndex = 0;
size_t index = 0;
while (index != strLength) {
int match = StringMatch(str, sep, index);
if (match == -1) {
break;
}
size_t endIndex = match + sepLength;
if (endIndex == lastEndIndex) {
index++;
continue;
}
MOZ_ASSERT(lastEndIndex < endIndex);
MOZ_ASSERT(sepLength <= strLength);
MOZ_ASSERT(lastEndIndex + sepLength <= endIndex);
size_t subLength = size_t(endIndex - sepLength - lastEndIndex);
JSString* sub = NewDependentString(cx, str, lastEndIndex, subLength);
if (!sub || !splits.append(StringValue(sub))) {
return nullptr;
}
if (splits.length() == limit) {
return NewCopiedArrayTryUseGroup(cx, group, splits.begin(),
splits.length());
}
index = endIndex;
lastEndIndex = index;
}
JSString* sub =
NewDependentString(cx, str, lastEndIndex, strLength - lastEndIndex);
if (!sub || !splits.append(StringValue(sub))) {
return nullptr;
}
return NewCopiedArrayTryUseGroup(cx, group, splits.begin(), splits.length());
}
static ArrayObject* CharSplitHelper(JSContext* cx, HandleLinearString str,
uint32_t limit, HandleObjectGroup group) {
size_t strLength = str->length();
if (strLength == 0) {
return NewFullyAllocatedArrayTryUseGroup(cx, group, 0);
}
js::StaticStrings& staticStrings = cx->staticStrings();
uint32_t resultlen = (limit < strLength ? limit : strLength);
MOZ_ASSERT(limit > 0 && resultlen > 0,
"Neither limit nor strLength is zero, so resultlen is greater "
"than zero.");
RootedArrayObject splits(cx,
NewFullyAllocatedStringArray(cx, group, resultlen));
if (!splits) {
return nullptr;
}
if (str->hasLatin1Chars()) {
splits->setDenseInitializedLength(resultlen);
JS::AutoCheckCannotGC nogc;
const Latin1Char* latin1Chars = str->latin1Chars(nogc);
for (size_t i = 0; i < resultlen; ++i) {
Latin1Char c = latin1Chars[i];
MOZ_ASSERT(staticStrings.hasUnit(c));
splits->initDenseElement(i, StringValue(staticStrings.getUnit(c)));
}
} else {
splits->ensureDenseInitializedLength(cx, 0, resultlen);
for (size_t i = 0; i < resultlen; ++i) {
JSString* sub = staticStrings.getUnitStringForElement(cx, str, i);
if (!sub) {
return nullptr;
}
splits->initDenseElement(i, StringValue(sub));
}
}
return splits;
}
template <typename TextChar>
static MOZ_ALWAYS_INLINE ArrayObject* SplitSingleCharHelper(
JSContext* cx, HandleLinearString str, const TextChar* text,
uint32_t textLen, char16_t patCh, HandleObjectGroup group) {
uint32_t count = 0;
for (size_t index = 0; index < textLen; index++) {
if (static_cast<char16_t>(text[index]) == patCh) {
count++;
}
}
if (count == 0) {
return SingleElementStringArray(cx, group, str);
}
RootedArrayObject splits(cx,
NewFullyAllocatedStringArray(cx, group, count + 1));
if (!splits) {
return nullptr;
}
splits->ensureDenseInitializedLength(cx, 0, count + 1);
uint32_t splitsIndex = 0;
size_t lastEndIndex = 0;
for (size_t index = 0; index < textLen; index++) {
if (static_cast<char16_t>(text[index]) == patCh) {
size_t subLength = size_t(index - lastEndIndex);
JSString* sub = NewDependentString(cx, str, lastEndIndex, subLength);
if (!sub) {
return nullptr;
}
splits->initDenseElement(splitsIndex++, StringValue(sub));
lastEndIndex = index + 1;
}
}
JSString* sub =
NewDependentString(cx, str, lastEndIndex, textLen - lastEndIndex);
if (!sub) {
return nullptr;
}
splits->initDenseElement(splitsIndex++, StringValue(sub));
return splits;
}
static ArrayObject* SplitSingleCharHelper(JSContext* cx, HandleLinearString str,
char16_t ch,
HandleObjectGroup group) {
size_t strLength = str->length();
AutoStableStringChars linearChars(cx);
if (!linearChars.init(cx, str)) {
return nullptr;
}
if (linearChars.isLatin1()) {
return SplitSingleCharHelper(cx, str, linearChars.latin1Chars(), strLength,
ch, group);
}
return SplitSingleCharHelper(cx, str, linearChars.twoByteChars(), strLength,
ch, group);
}
ArrayObject* js::StringSplitString(JSContext* cx, HandleObjectGroup group,
HandleString str, HandleString sep,
uint32_t limit) {
MOZ_ASSERT(limit > 0, "Only called for strictly positive limit.");
RootedLinearString linearStr(cx, str->ensureLinear(cx));
if (!linearStr) {
return nullptr;
}
RootedLinearString linearSep(cx, sep->ensureLinear(cx));
if (!linearSep) {
return nullptr;
}
if (linearSep->length() == 0) {
return CharSplitHelper(cx, linearStr, limit, group);
}
if (linearSep->length() == 1 && limit >= static_cast<uint32_t>(INT32_MAX)) {
char16_t ch = linearSep->latin1OrTwoByteChar(0);
return SplitSingleCharHelper(cx, linearStr, ch, group);
}
return SplitHelper(cx, linearStr, limit, linearSep, group);
}
bool js::str_concat(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
JSString* str = ToStringForStringFunction(cx, args.thisv());
if (!str) {
return false;
}
for (unsigned i = 0; i < args.length(); i++) {
JSString* argStr = ToString<NoGC>(cx, args[i]);
if (!argStr) {
RootedString strRoot(cx, str);
argStr = ToString<CanGC>(cx, args[i]);
if (!argStr) {
return false;
}
str = strRoot;
}
JSString* next = ConcatStrings<NoGC>(cx, str, argStr);
if (next) {
str = next;
} else {
RootedString strRoot(cx, str), argStrRoot(cx, argStr);
str = ConcatStrings<CanGC>(cx, strRoot, argStrRoot);
if (!str) {
return false;
}
}
}
args.rval().setString(str);
return true;
}
static const JSFunctionSpec string_methods[] = {
JS_FN(js_toSource_str, str_toSource, 0, 0),
JS_FN(js_toString_str, str_toString, 0, 0),
JS_FN(js_valueOf_str, str_toString, 0, 0),
JS_INLINABLE_FN("toLowerCase", str_toLowerCase, 0, 0, StringToLowerCase),
JS_INLINABLE_FN("toUpperCase", str_toUpperCase, 0, 0, StringToUpperCase),
JS_INLINABLE_FN("charAt", str_charAt, 1, 0, StringCharAt),
JS_INLINABLE_FN("charCodeAt", str_charCodeAt, 1, 0, StringCharCodeAt),
JS_SELF_HOSTED_FN("substring", "String_substring", 2, 0),
JS_SELF_HOSTED_FN("padStart", "String_pad_start", 2, 0),
JS_SELF_HOSTED_FN("padEnd", "String_pad_end", 2, 0),
JS_SELF_HOSTED_FN("codePointAt", "String_codePointAt", 1, 0),
JS_FN("includes", str_includes, 1, 0), JS_FN("indexOf", str_indexOf, 1, 0),
JS_FN("lastIndexOf", str_lastIndexOf, 1, 0),
JS_FN("startsWith", str_startsWith, 1, 0),
JS_FN("endsWith", str_endsWith, 1, 0), JS_FN("trim", str_trim, 0, 0),
JS_FN("trimStart", str_trimStart, 0, 0),
JS_FN("trimEnd", str_trimEnd, 0, 0),
#if EXPOSE_INTL_API
JS_SELF_HOSTED_FN("toLocaleLowerCase", "String_toLocaleLowerCase", 0, 0),
JS_SELF_HOSTED_FN("toLocaleUpperCase", "String_toLocaleUpperCase", 0, 0),
JS_SELF_HOSTED_FN("localeCompare", "String_localeCompare", 1, 0),
#else
JS_FN("toLocaleLowerCase", str_toLocaleLowerCase, 0, 0),
JS_FN("toLocaleUpperCase", str_toLocaleUpperCase, 0, 0),
JS_FN("localeCompare", str_localeCompare, 1, 0),
#endif
JS_SELF_HOSTED_FN("repeat", "String_repeat", 1, 0),
#if EXPOSE_INTL_API
JS_FN("normalize", str_normalize, 0, 0),
#endif
JS_SELF_HOSTED_FN("match", "String_match", 1, 0),
JS_SELF_HOSTED_FN("matchAll", "String_matchAll", 1, 0),
JS_SELF_HOSTED_FN("search", "String_search", 1, 0),
JS_SELF_HOSTED_FN("replace", "String_replace", 2, 0),
JS_SELF_HOSTED_FN("split", "String_split", 2, 0),
JS_SELF_HOSTED_FN("substr", "String_substr", 2, 0),
JS_FN("concat", str_concat, 1, 0),
JS_SELF_HOSTED_FN("slice", "String_slice", 2, 0),
JS_SELF_HOSTED_FN("bold", "String_bold", 0, 0),
JS_SELF_HOSTED_FN("italics", "String_italics", 0, 0),
JS_SELF_HOSTED_FN("fixed", "String_fixed", 0, 0),
JS_SELF_HOSTED_FN("strike", "String_strike", 0, 0),
JS_SELF_HOSTED_FN("small", "String_small", 0, 0),
JS_SELF_HOSTED_FN("big", "String_big", 0, 0),
JS_SELF_HOSTED_FN("blink", "String_blink", 0, 0),
JS_SELF_HOSTED_FN("sup", "String_sup", 0, 0),
JS_SELF_HOSTED_FN("sub", "String_sub", 0, 0),
JS_SELF_HOSTED_FN("anchor", "String_anchor", 1, 0),
JS_SELF_HOSTED_FN("link", "String_link", 1, 0),
JS_SELF_HOSTED_FN("fontcolor", "String_fontcolor", 1, 0),
JS_SELF_HOSTED_FN("fontsize", "String_fontsize", 1, 0),
JS_SELF_HOSTED_SYM_FN(iterator, "String_iterator", 0, 0), JS_FS_END};
bool js::StringConstructor(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedString str(cx);
if (args.length() > 0) {
if (!args.isConstructing() && args[0].isSymbol()) {
return js::SymbolDescriptiveString(cx, args[0].toSymbol(), args.rval());
}
str = ToString<CanGC>(cx, args[0]);
if (!str) {
return false;
}
} else {
str = cx->runtime()->emptyString;
}
if (args.isConstructing()) {
RootedObject proto(cx);
if (!GetPrototypeFromBuiltinConstructor(cx, args, JSProto_String, &proto)) {
return false;
}
StringObject* strobj = StringObject::create(cx, str, proto);
if (!strobj) {
return false;
}
args.rval().setObject(*strobj);
return true;
}
args.rval().setString(str);
return true;
}
bool js::str_fromCharCode(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
MOZ_ASSERT(args.length() <= ARGS_LENGTH_MAX);
if (args.length() == 1) {
return str_fromCharCode_one_arg(cx, args[0], args.rval());
}
InlineCharBuffer<char16_t> chars;
if (!chars.maybeAlloc(cx, args.length())) {
return false;
}
char16_t* rawChars = chars.get();
for (unsigned i = 0; i < args.length(); i++) {
uint16_t code;
if (!ToUint16(cx, args[i], &code)) {
return false;
}
rawChars[i] = char16_t(code);
}
JSString* str = chars.toString(cx, args.length());
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
static inline bool CodeUnitToString(JSContext* cx, uint16_t ucode,
MutableHandleValue rval) {
if (StaticStrings::hasUnit(ucode)) {
rval.setString(cx->staticStrings().getUnit(ucode));
return true;
}
char16_t c = char16_t(ucode);
JSString* str = NewStringCopyNDontDeflate<CanGC>(cx, &c, 1);
if (!str) {
return false;
}
rval.setString(str);
return true;
}
bool js::str_fromCharCode_one_arg(JSContext* cx, HandleValue code,
MutableHandleValue rval) {
uint16_t ucode;
if (!ToUint16(cx, code, &ucode)) {
return false;
}
return CodeUnitToString(cx, ucode, rval);
}
static MOZ_ALWAYS_INLINE bool ToCodePoint(JSContext* cx, HandleValue code,
uint32_t* codePoint) {
if (code.isInt32()) {
int32_t nextCP = code.toInt32();
if (nextCP >= 0 && nextCP <= int32_t(unicode::NonBMPMax)) {
*codePoint = uint32_t(nextCP);
return true;
}
}
double nextCP;
if (!ToNumber(cx, code, &nextCP)) {
return false;
}
if (JS::ToInteger(nextCP) != nextCP || nextCP < 0 ||
nextCP > unicode::NonBMPMax) {
ToCStringBuf cbuf;
if (const char* numStr = NumberToCString(cx, &cbuf, nextCP)) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr,
JSMSG_NOT_A_CODEPOINT, numStr);
}
return false;
}
*codePoint = uint32_t(nextCP);
return true;
}
bool js::str_fromCodePoint_one_arg(JSContext* cx, HandleValue code,
MutableHandleValue rval) {
uint32_t codePoint;
if (!ToCodePoint(cx, code, &codePoint)) {
return false;
}
if (!unicode::IsSupplementary(codePoint)) {
return CodeUnitToString(cx, uint16_t(codePoint), rval);
}
char16_t chars[] = {unicode::LeadSurrogate(codePoint),
unicode::TrailSurrogate(codePoint)};
JSString* str = NewStringCopyNDontDeflate<CanGC>(cx, chars, 2);
if (!str) {
return false;
}
rval.setString(str);
return true;
}
static bool str_fromCodePoint_few_args(JSContext* cx, const CallArgs& args) {
MOZ_ASSERT(args.length() <= JSFatInlineString::MAX_LENGTH_TWO_BYTE / 2);
char16_t elements[JSFatInlineString::MAX_LENGTH_TWO_BYTE];
unsigned length = 0;
for (unsigned nextIndex = 0; nextIndex < args.length(); nextIndex++) {
uint32_t codePoint;
if (!ToCodePoint(cx, args[nextIndex], &codePoint)) {
return false;
}
unicode::UTF16Encode(codePoint, elements, &length);
}
JSString* str = NewStringCopyN<CanGC>(cx, elements, length);
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
bool js::str_fromCodePoint(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
if (args.length() == 1) {
return str_fromCodePoint_one_arg(cx, args[0], args.rval());
}
if (args.length() <= JSFatInlineString::MAX_LENGTH_TWO_BYTE / 2) {
return str_fromCodePoint_few_args(cx, args);
}
static_assert(
ARGS_LENGTH_MAX < std::numeric_limits<decltype(args.length())>::max() / 2,
"|args.length() * 2 + 1| does not overflow");
auto elements = cx->make_pod_array<char16_t>(args.length() * 2 + 1);
if (!elements) {
return false;
}
unsigned length = 0;
for (unsigned nextIndex = 0; nextIndex < args.length(); nextIndex++) {
uint32_t codePoint;
if (!ToCodePoint(cx, args[nextIndex], &codePoint)) {
return false;
}
unicode::UTF16Encode(codePoint, elements.get(), &length);
}
elements[length] = 0;
JSString* str = NewString<CanGC>(cx, std::move(elements), length);
if (!str) {
return false;
}
args.rval().setString(str);
return true;
}
static const JSFunctionSpec string_static_methods[] = {
JS_INLINABLE_FN("fromCharCode", js::str_fromCharCode, 1, 0,
StringFromCharCode),
JS_INLINABLE_FN("fromCodePoint", js::str_fromCodePoint, 1, 0,
StringFromCodePoint),
JS_SELF_HOSTED_FN("raw", "String_static_raw", 1, 0),
JS_SELF_HOSTED_FN("substring", "String_static_substring", 3, 0),
JS_SELF_HOSTED_FN("substr", "String_static_substr", 3, 0),
JS_SELF_HOSTED_FN("slice", "String_static_slice", 3, 0),
JS_SELF_HOSTED_FN("match", "String_generic_match", 2, 0),
JS_SELF_HOSTED_FN("replace", "String_generic_replace", 3, 0),
JS_SELF_HOSTED_FN("search", "String_generic_search", 2, 0),
JS_SELF_HOSTED_FN("split", "String_generic_split", 3, 0),
JS_SELF_HOSTED_FN("toLowerCase", "String_static_toLowerCase", 1, 0),
JS_SELF_HOSTED_FN("toUpperCase", "String_static_toUpperCase", 1, 0),
JS_SELF_HOSTED_FN("charAt", "String_static_charAt", 2, 0),
JS_SELF_HOSTED_FN("charCodeAt", "String_static_charCodeAt", 2, 0),
JS_SELF_HOSTED_FN("includes", "String_static_includes", 2, 0),
JS_SELF_HOSTED_FN("indexOf", "String_static_indexOf", 2, 0),
JS_SELF_HOSTED_FN("lastIndexOf", "String_static_lastIndexOf", 2, 0),
JS_SELF_HOSTED_FN("startsWith", "String_static_startsWith", 2, 0),
JS_SELF_HOSTED_FN("endsWith", "String_static_endsWith", 2, 0),
JS_SELF_HOSTED_FN("trim", "String_static_trim", 1, 0),
JS_SELF_HOSTED_FN("trimLeft", "String_static_trimLeft", 1, 0),
JS_SELF_HOSTED_FN("trimRight", "String_static_trimRight", 1, 0),
JS_SELF_HOSTED_FN("toLocaleLowerCase", "String_static_toLocaleLowerCase", 1,
0),
JS_SELF_HOSTED_FN("toLocaleUpperCase", "String_static_toLocaleUpperCase", 1,
0),
#if EXPOSE_INTL_API
JS_SELF_HOSTED_FN("normalize", "String_static_normalize", 1, 0),
#endif
JS_SELF_HOSTED_FN("concat", "String_static_concat", 2, 0),
JS_SELF_HOSTED_FN("localeCompare", "String_static_localeCompare", 2, 0),
JS_FS_END};
Shape* StringObject::assignInitialShape(JSContext* cx,
Handle<StringObject*> obj) {
MOZ_ASSERT(obj->empty());
return NativeObject::addDataProperty(cx, obj, cx->names().length, LENGTH_SLOT,
JSPROP_PERMANENT | JSPROP_READONLY);
}
JSObject* js::InitStringClass(JSContext* cx, Handle<GlobalObject*> global) {
Rooted<JSString*> empty(cx, cx->runtime()->emptyString);
Rooted<StringObject*> proto(
cx, GlobalObject::createBlankPrototype<StringObject>(cx, global));
if (!proto) {
return nullptr;
}
if (!StringObject::init(cx, proto, empty)) {
return nullptr;
}
RootedFunction ctor(cx);
ctor = GlobalObject::createConstructor(
cx, StringConstructor, cx->names().String, 1, gc::AllocKind::FUNCTION,
&jit::JitInfo_String);
if (!ctor) {
return nullptr;
}
if (!LinkConstructorAndPrototype(cx, ctor, proto)) {
return nullptr;
}
if (!DefinePropertiesAndFunctions(cx, proto, nullptr, string_methods) ||
!DefinePropertiesAndFunctions(cx, ctor, nullptr, string_static_methods)) {
return nullptr;
}
RootedValue trimFn(cx);
RootedId trimId(cx, NameToId(cx->names().trimStart));
RootedId trimAliasId(cx, NameToId(cx->names().trimLeft));
if (!NativeGetProperty(cx, proto, trimId, &trimFn) ||
!NativeDefineDataProperty(cx, proto, trimAliasId, trimFn, 0)) {
return nullptr;
}
trimId = NameToId(cx->names().trimEnd);
trimAliasId = NameToId(cx->names().trimRight);
if (!NativeGetProperty(cx, proto, trimId, &trimFn) ||
!NativeDefineDataProperty(cx, proto, trimAliasId, trimFn, 0)) {
return nullptr;
}
if (!JS_DefineFunctions(cx, global, string_functions)) {
return nullptr;
}
if (!GlobalObject::initBuiltinConstructor(cx, global, JSProto_String, ctor,
proto)) {
return nullptr;
}
return proto;
}
#define ____ false
static const bool js_isUriReservedPlusPound[] = {
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, true, true, ____, true, ____,
____, ____, ____, true, true, ____, ____, true, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, true, true,
____, true, ____, true, true, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____
};
static const bool js_isUriUnescaped[] = {
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, ____, ____, ____, ____, ____, ____, ____,
____, ____, ____, true, ____, ____, ____, ____, ____, true,
true, true, true, ____, ____, true, true, ____, true, true,
true, true, true, true, true, true, true, true, ____, ____,
____, ____, ____, ____, ____, true, true, true, true, true,
true, true, true, true, true, true, true, true, true, true,
true, true, true, true, true, true, true, true, true, true,
true, ____, ____, ____, ____, true, ____, true, true, true,
true, true, true, true, true, true, true, true, true, true,
true, true, true, true, true, true, true, true, true, true,
true, true, true, ____, ____, ____, true, ____
};
#undef ____
static inline bool TransferBufferToString(StringBuffer& sb, JSString* str,
MutableHandleValue rval) {
if (!sb.empty()) {
str = sb.finishString();
if (!str) {
return false;
}
}
rval.setString(str);
return true;
}
enum EncodeResult { Encode_Failure, Encode_BadUri, Encode_Success };
template <typename CharT>
static MOZ_NEVER_INLINE EncodeResult Encode(StringBuffer& sb,
const CharT* chars, size_t length,
const bool* unescapedSet) {
Latin1Char hexBuf[3];
hexBuf[0] = '%';
auto appendEncoded = [&sb, &hexBuf](Latin1Char c) {
static const char HexDigits[] = "0123456789ABCDEF";
hexBuf[1] = HexDigits[c >> 4];
hexBuf[2] = HexDigits[c & 0xf];
return sb.append(hexBuf, 3);
};
auto appendRange = [&sb, chars, length](size_t start, size_t end) {
MOZ_ASSERT(start <= end);
if (start < end) {
if (start == 0) {
if (!sb.reserve(length)) {
return false;
}
}
return sb.append(chars + start, chars + end);
}
return true;
};
size_t startAppend = 0;
for (size_t k = 0; k < length; k++) {
CharT c = chars[k];
if (c < 128 &&
(js_isUriUnescaped[c] || (unescapedSet && unescapedSet[c]))) {
continue;
} else {
if (!appendRange(startAppend, k)) {
return Encode_Failure;
}
if (mozilla::IsSame<CharT, Latin1Char>::value) {
if (c < 0x80) {
if (!appendEncoded(c)) {
return Encode_Failure;
}
} else {
if (!appendEncoded(0xC0 | (c >> 6)) ||
!appendEncoded(0x80 | (c & 0x3F))) {
return Encode_Failure;
}
}
} else {
if (unicode::IsTrailSurrogate(c)) {
return Encode_BadUri;
}
uint32_t v;
if (!unicode::IsLeadSurrogate(c)) {
v = c;
} else {
k++;
if (k == length) {
return Encode_BadUri;
}
char16_t c2 = chars[k];
if (!unicode::IsTrailSurrogate(c2)) {
return Encode_BadUri;
}
v = unicode::UTF16Decode(c, c2);
}
uint8_t utf8buf[4];
size_t L = OneUcs4ToUtf8Char(utf8buf, v);
for (size_t j = 0; j < L; j++) {
if (!appendEncoded(utf8buf[j])) {
return Encode_Failure;
}
}
}
startAppend = k + 1;
}
}
if (startAppend > 0) {
if (!appendRange(startAppend, length)) {
return Encode_Failure;
}
}
return Encode_Success;
}
static MOZ_ALWAYS_INLINE bool Encode(JSContext* cx, HandleLinearString str,
const bool* unescapedSet,
MutableHandleValue rval) {
size_t length = str->length();
if (length == 0) {
rval.setString(cx->runtime()->emptyString);
return true;
}
StringBuffer sb(cx);
EncodeResult res;
if (str->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
res = Encode(sb, str->latin1Chars(nogc), str->length(), unescapedSet);
} else {
AutoCheckCannotGC nogc;
res = Encode(sb, str->twoByteChars(nogc), str->length(), unescapedSet);
}
if (res == Encode_Failure) {
return false;
}
if (res == Encode_BadUri) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr, JSMSG_BAD_URI);
return false;
}
MOZ_ASSERT(res == Encode_Success);
return TransferBufferToString(sb, str, rval);
}
enum DecodeResult { Decode_Failure, Decode_BadUri, Decode_Success };
template <typename CharT>
static DecodeResult Decode(StringBuffer& sb, const CharT* chars, size_t length,
const bool* reservedSet) {
auto appendRange = [&sb, chars](size_t start, size_t end) {
MOZ_ASSERT(start <= end);
if (start < end) {
return sb.append(chars + start, chars + end);
}
return true;
};
size_t startAppend = 0;
for (size_t k = 0; k < length; k++) {
CharT c = chars[k];
if (c == '%') {
size_t start = k;
if ((k + 2) >= length) {
return Decode_BadUri;
}
if (!JS7_ISHEX(chars[k + 1]) || !JS7_ISHEX(chars[k + 2])) {
return Decode_BadUri;
}
uint32_t B = JS7_UNHEX(chars[k + 1]) * 16 + JS7_UNHEX(chars[k + 2]);
k += 2;
if (B < 128) {
Latin1Char ch = Latin1Char(B);
if (reservedSet && reservedSet[ch]) {
continue;
}
if (!appendRange(startAppend, start)) {
return Decode_Failure;
}
if (!sb.append(ch)) {
return Decode_Failure;
}
} else {
int n = 1;
while (B & (0x80 >> n)) {
n++;
}
if (n == 1 || n > 4) {
return Decode_BadUri;
}
uint8_t octets[4];
octets[0] = (uint8_t)B;
if (k + 3 * (n - 1) >= length) {
return Decode_BadUri;
}
for (int j = 1; j < n; j++) {
k++;
if (chars[k] != '%') {
return Decode_BadUri;
}
if (!JS7_ISHEX(chars[k + 1]) || !JS7_ISHEX(chars[k + 2])) {
return Decode_BadUri;
}
B = JS7_UNHEX(chars[k + 1]) * 16 + JS7_UNHEX(chars[k + 2]);
if ((B & 0xC0) != 0x80) {
return Decode_BadUri;
}
k += 2;
octets[j] = char(B);
}
if (!appendRange(startAppend, start)) {
return Decode_Failure;
}
uint32_t v = JS::Utf8ToOneUcs4Char(octets, n);
MOZ_ASSERT(v >= 128);
if (v >= unicode::NonBMPMin) {
if (v > unicode::NonBMPMax) {
return Decode_BadUri;
}
if (!sb.append(unicode::LeadSurrogate(v))) {
return Decode_Failure;
}
if (!sb.append(unicode::TrailSurrogate(v))) {
return Decode_Failure;
}
} else {
if (!sb.append(char16_t(v))) {
return Decode_Failure;
}
}
}
startAppend = k + 1;
}
}
if (startAppend > 0) {
if (!appendRange(startAppend, length)) {
return Decode_Failure;
}
}
return Decode_Success;
}
static bool Decode(JSContext* cx, HandleLinearString str,
const bool* reservedSet, MutableHandleValue rval) {
size_t length = str->length();
if (length == 0) {
rval.setString(cx->runtime()->emptyString);
return true;
}
StringBuffer sb(cx);
DecodeResult res;
if (str->hasLatin1Chars()) {
AutoCheckCannotGC nogc;
res = Decode(sb, str->latin1Chars(nogc), str->length(), reservedSet);
} else {
AutoCheckCannotGC nogc;
res = Decode(sb, str->twoByteChars(nogc), str->length(), reservedSet);
}
if (res == Decode_Failure) {
return false;
}
if (res == Decode_BadUri) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr, JSMSG_BAD_URI);
return false;
}
MOZ_ASSERT(res == Decode_Success);
return TransferBufferToString(sb, str, rval);
}
static bool str_decodeURI(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
return Decode(cx, str, js_isUriReservedPlusPound, args.rval());
}
static bool str_decodeURI_Component(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
return Decode(cx, str, nullptr, args.rval());
}
static bool str_encodeURI(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
return Encode(cx, str, js_isUriReservedPlusPound, args.rval());
}
static bool str_encodeURI_Component(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
RootedLinearString str(cx, ArgToLinearString(cx, args, 0));
if (!str) {
return false;
}
return Encode(cx, str, nullptr, args.rval());
}
JSString* js::EncodeURI(JSContext* cx, const char* chars, size_t length) {
StringBuffer sb(cx);
EncodeResult result = Encode(sb, reinterpret_cast<const Latin1Char*>(chars),
length, js_isUriReservedPlusPound);
if (result == EncodeResult::Encode_Failure) {
return nullptr;
}
if (result == EncodeResult::Encode_BadUri) {
JS_ReportErrorNumberASCII(cx, GetErrorMessage, nullptr, JSMSG_BAD_URI);
return nullptr;
}
if (sb.empty()) {
return NewStringCopyN<CanGC>(cx, chars, length);
}
return sb.finishString();
}
static bool FlatStringMatchHelper(JSContext* cx, HandleString str,
HandleString pattern, bool* isFlat,
int32_t* match) {
RootedLinearString linearPattern(cx, pattern->ensureLinear(cx));
if (!linearPattern) {
return false;
}
static const size_t MAX_FLAT_PAT_LEN = 256;
if (linearPattern->length() > MAX_FLAT_PAT_LEN ||
StringHasRegExpMetaChars(linearPattern)) {
*isFlat = false;
return true;
}
*isFlat = true;
if (str->isRope()) {
if (!RopeMatch(cx, &str->asRope(), linearPattern, match)) {
return false;
}
} else {
*match = StringMatch(&str->asLinear(), linearPattern);
}
return true;
}
static bool BuildFlatMatchArray(JSContext* cx, HandleString str,
HandleString pattern, int32_t match,
MutableHandleValue rval) {
if (match < 0) {
rval.setNull();
return true;
}
JSObject* templateObject =
cx->realm()->regExps.getOrCreateMatchResultTemplateObject(cx);
if (!templateObject) {
return false;
}
RootedArrayObject arr(
cx, NewDenseFullyAllocatedArrayWithTemplate(cx, 1, templateObject));
if (!arr) {
return false;
}
arr->setDenseInitializedLength(1);
arr->initDenseElement(0, StringValue(pattern));
arr->setSlot(0, Int32Value(match));
arr->setSlot(1, StringValue(str));
#ifdef DEBUG
RootedValue test(cx);
RootedId id(cx, NameToId(cx->names().index));
if (!NativeGetProperty(cx, arr, id, &test)) {
return false;
}
MOZ_ASSERT(test == arr->getSlot(0));
id = NameToId(cx->names().input);
if (!NativeGetProperty(cx, arr, id, &test)) {
return false;
}
MOZ_ASSERT(test == arr->getSlot(1));
#endif
rval.setObject(*arr);
return true;
}
#ifdef DEBUG
static bool CallIsStringOptimizable(JSContext* cx, const char* name,
bool* result) {
FixedInvokeArgs<0> args(cx);
RootedValue rval(cx);
if (!CallSelfHostedFunction(cx, name, UndefinedHandleValue, args, &rval)) {
return false;
}
*result = rval.toBoolean();
return true;
}
#endif
bool js::FlatStringMatch(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
MOZ_ASSERT(args.length() == 2);
MOZ_ASSERT(args[0].isString());
MOZ_ASSERT(args[1].isString());
#ifdef DEBUG
bool isOptimizable = false;
if (!CallIsStringOptimizable(cx, "IsStringMatchOptimizable",
&isOptimizable)) {
return false;
}
MOZ_ASSERT(isOptimizable);
#endif
RootedString str(cx, args[0].toString());
RootedString pattern(cx, args[1].toString());
bool isFlat = false;
int32_t match = 0;
if (!FlatStringMatchHelper(cx, str, pattern, &isFlat, &match)) {
return false;
}
if (!isFlat) {
args.rval().setUndefined();
return true;
}
return BuildFlatMatchArray(cx, str, pattern, match, args.rval());
}
bool js::FlatStringSearch(JSContext* cx, unsigned argc, Value* vp) {
CallArgs args = CallArgsFromVp(argc, vp);
MOZ_ASSERT(args.length() == 2);
MOZ_ASSERT(args[0].isString());
MOZ_ASSERT(args[1].isString());
#ifdef DEBUG
bool isOptimizable = false;
if (!CallIsStringOptimizable(cx, "IsStringSearchOptimizable",
&isOptimizable)) {
return false;
}
MOZ_ASSERT(isOptimizable);
#endif
RootedString str(cx, args[0].toString());
RootedString pattern(cx, args[1].toString());
bool isFlat = false;
int32_t match = 0;
if (!FlatStringMatchHelper(cx, str, pattern, &isFlat, &match)) {
return false;
}
if (!isFlat) {
args.rval().setInt32(-2);
return true;
}
args.rval().setInt32(match);
return true;
}