/**************************************************************************** ** ** Copyright (C) 2014 Digia Plc and/or its subsidiary(-ies). ** Contact: http://www.qt-project.org/legal ** ** This file is part of the QtQml module of the Qt Toolkit. ** ** $QT_BEGIN_LICENSE:LGPL21$ ** Commercial License Usage ** Licensees holding valid commercial Qt licenses may use this file in ** accordance with the commercial license agreement provided with the ** Software or, alternatively, in accordance with the terms contained in ** a written agreement between you and Digia. For licensing terms and ** conditions see http://qt.digia.com/licensing. For further information ** use the contact form at http://qt.digia.com/contact-us. ** ** GNU Lesser General Public License Usage ** Alternatively, this file may be used under the terms of the GNU Lesser ** General Public License version 2.1 or version 3 as published by the Free ** Software Foundation and appearing in the file LICENSE.LGPLv21 and ** LICENSE.LGPLv3 included in the packaging of this file. Please review the ** following information to ensure the GNU Lesser General Public License ** requirements will be met: https://www.gnu.org/licenses/lgpl.html and ** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html. ** ** In addition, as a special exception, Digia gives you certain additional ** rights. These rights are described in the Digia Qt LGPL Exception ** version 1.1, included in the file LGPL_EXCEPTION.txt in this package. ** ** $QT_END_LICENSE$ ** ****************************************************************************/ #include "qv4regexpobject_p.h" #include "qv4jsir_p.h" #include "qv4isel_p.h" #include "qv4objectproto_p.h" #include "qv4stringobject_p.h" #include "qv4mm_p.h" #include "qv4scopedvalue_p.h" #include #include #include #include #include #include #include "private/qlocale_tools_p.h" #include #include #include #include #include #include #include "qv4alloca_p.h" QT_BEGIN_NAMESPACE Q_CORE_EXPORT QString qt_regexp_toCanonical(const QString &, QRegExp::PatternSyntax); using namespace QV4; DEFINE_OBJECT_VTABLE(RegExpObject); DEFINE_OBJECT_VTABLE(RegExpPrototype); RegExpObject::Data::Data(InternalClass *ic) : Object::Data(ic) { setVTable(staticVTable()); Scope scope(ic->engine); Scoped o(scope, this); o->d()->value = reinterpret_cast(RegExp::create(ic->engine, QString(), false, false)); o->d()->global = false; o->init(ic->engine); } RegExpObject::Data::Data(ExecutionEngine *engine, RegExp *value, bool global) : Object::Data(engine->regExpClass) , value(value) , global(global) { setVTable(staticVTable()); Scope scope(engine); Scoped o(scope, this); o->init(engine); } // Converts a QRegExp to a JS RegExp. // The conversion is not 100% exact since ECMA regexp and QRegExp // have different semantics/flags, but we try to do our best. RegExpObject::Data::Data(ExecutionEngine *engine, const QRegExp &re) : Object::Data(engine->regExpClass) { setVTable(staticVTable()); value = 0; global = false; // Convert the pattern to a ECMAScript pattern. QString pattern = QT_PREPEND_NAMESPACE(qt_regexp_toCanonical)(re.pattern(), re.patternSyntax()); if (re.isMinimal()) { QString ecmaPattern; int len = pattern.length(); ecmaPattern.reserve(len); int i = 0; const QChar *wc = pattern.unicode(); bool inBracket = false; while (i < len) { QChar c = wc[i++]; ecmaPattern += c; switch (c.unicode()) { case '?': case '+': case '*': case '}': if (!inBracket) ecmaPattern += QLatin1Char('?'); break; case '\\': if (i < len) ecmaPattern += wc[i++]; break; case '[': inBracket = true; break; case ']': inBracket = false; break; default: break; } } pattern = ecmaPattern; } Scope scope(engine); Scoped o(scope, this); o->d()->value = reinterpret_cast(RegExp::create(engine, pattern, re.caseSensitivity() == Qt::CaseInsensitive, false)); o->init(engine); } void RegExpObject::init(ExecutionEngine *engine) { Scope scope(engine); ScopedObject protectThis(scope, this); ScopedString lastIndex(scope, engine->newIdentifier(QStringLiteral("lastIndex"))); ScopedValue v(scope, Primitive::fromInt32(0)); insertMember(lastIndex.getPointer(), v, Attr_NotEnumerable|Attr_NotConfigurable); if (!this->value()) return; QString p = this->value()->pattern(); if (p.isEmpty()) { p = QStringLiteral("(?:)"); } else { // escape certain parts, see ch. 15.10.4 p.replace('/', QLatin1String("\\/")); } defineReadonlyProperty(QStringLiteral("source"), (v = engine->newString(p))); defineReadonlyProperty(QStringLiteral("global"), Primitive::fromBoolean(global())); defineReadonlyProperty(QStringLiteral("ignoreCase"), Primitive::fromBoolean(this->value()->ignoreCase())); defineReadonlyProperty(QStringLiteral("multiline"), Primitive::fromBoolean(this->value()->multiLine())); } void RegExpObject::markObjects(Managed *that, ExecutionEngine *e) { RegExpObject *re = static_cast(that); if (re->value()) re->value()->mark(e); Object::markObjects(that, e); } Property *RegExpObject::lastIndexProperty(ExecutionContext *ctx) { Q_UNUSED(ctx); Q_ASSERT(0 == internalClass()->find(ctx->d()->engine->newIdentifier(QStringLiteral("lastIndex")))); return propertyAt(0); } // Converts a JS RegExp to a QRegExp. // The conversion is not 100% exact since ECMA regexp and QRegExp // have different semantics/flags, but we try to do our best. QRegExp RegExpObject::toQRegExp() const { Qt::CaseSensitivity caseSensitivity = value()->ignoreCase() ? Qt::CaseInsensitive : Qt::CaseSensitive; return QRegExp(value()->pattern(), caseSensitivity, QRegExp::RegExp2); } QString RegExpObject::toString() const { QString result = QLatin1Char('/') + source(); result += QLatin1Char('/'); if (global()) result += QLatin1Char('g'); if (value()->ignoreCase()) result += QLatin1Char('i'); if (value()->multiLine()) result += QLatin1Char('m'); return result; } QString RegExpObject::source() const { Scope scope(engine()); ScopedString source(scope, scope.engine->newIdentifier(QStringLiteral("source"))); ScopedValue s(scope, const_cast(this)->get(source.getPointer())); return s->toQString(); } uint RegExpObject::flags() const { uint f = 0; if (global()) f |= QV4::RegExpObject::RegExp_Global; if (value()->ignoreCase()) f |= QV4::RegExpObject::RegExp_IgnoreCase; if (value()->multiLine()) f |= QV4::RegExpObject::RegExp_Multiline; return f; } DEFINE_OBJECT_VTABLE(RegExpCtor); RegExpCtor::Data::Data(ExecutionContext *scope) : FunctionObject::Data(scope, QStringLiteral("RegExp")) { setVTable(staticVTable()); clearLastMatch(); } void RegExpCtor::Data::clearLastMatch() { lastMatch = Primitive::nullValue(); lastInput = internalClass->engine->id_empty; lastMatchStart = 0; lastMatchEnd = 0; } ReturnedValue RegExpCtor::construct(Managed *m, CallData *callData) { ExecutionContext *ctx = m->engine()->currentContext(); Scope scope(ctx); ScopedValue r(scope, callData->argument(0)); ScopedValue f(scope, callData->argument(1)); Scoped re(scope, r); if (re) { if (!f->isUndefined()) return ctx->throwTypeError(); return Encode(ctx->d()->engine->newRegExpObject(re->value(), re->global())); } QString pattern; if (!r->isUndefined()) pattern = r->toString(ctx)->toQString(); if (scope.hasException()) return Encode::undefined(); bool global = false; bool ignoreCase = false; bool multiLine = false; if (!f->isUndefined()) { f = RuntimeHelpers::toString(ctx, f); if (scope.hasException()) return Encode::undefined(); QString str = f->stringValue()->toQString(); for (int i = 0; i < str.length(); ++i) { if (str.at(i) == QLatin1Char('g') && !global) { global = true; } else if (str.at(i) == QLatin1Char('i') && !ignoreCase) { ignoreCase = true; } else if (str.at(i) == QLatin1Char('m') && !multiLine) { multiLine = true; } else { return ctx->throwSyntaxError(QStringLiteral("Invalid flags supplied to RegExp constructor")); } } } RegExp *regexp = reinterpret_cast(RegExp::create(ctx->d()->engine, pattern, ignoreCase, multiLine)); if (!regexp->isValid()) return ctx->throwSyntaxError(QStringLiteral("Invalid regular expression")); return Encode(ctx->d()->engine->newRegExpObject(regexp, global)); } ReturnedValue RegExpCtor::call(Managed *that, CallData *callData) { if (callData->argc > 0 && callData->args[0].as()) { if (callData->argc == 1 || callData->args[1].isUndefined()) return callData->args[0].asReturnedValue(); } return construct(that, callData); } void RegExpCtor::markObjects(Managed *that, ExecutionEngine *e) { RegExpCtor *This = static_cast(that); This->lastMatch().mark(e); This->lastInput().mark(e); FunctionObject::markObjects(that, e); } void RegExpPrototype::init(ExecutionEngine *engine, Object *constructor) { Scope scope(engine); ScopedObject o(scope); ScopedObject ctor(scope, constructor); ctor->defineReadonlyProperty(engine->id_prototype, (o = this)); ctor->defineReadonlyProperty(engine->id_length, Primitive::fromInt32(2)); // Properties deprecated in the spec but required by "the web" :( ctor->defineAccessorProperty(QStringLiteral("lastMatch"), method_get_lastMatch_n<0>, 0); ctor->defineAccessorProperty(QStringLiteral("$&"), method_get_lastMatch_n<0>, 0); ctor->defineAccessorProperty(QStringLiteral("$1"), method_get_lastMatch_n<1>, 0); ctor->defineAccessorProperty(QStringLiteral("$2"), method_get_lastMatch_n<2>, 0); ctor->defineAccessorProperty(QStringLiteral("$3"), method_get_lastMatch_n<3>, 0); ctor->defineAccessorProperty(QStringLiteral("$4"), method_get_lastMatch_n<4>, 0); ctor->defineAccessorProperty(QStringLiteral("$5"), method_get_lastMatch_n<5>, 0); ctor->defineAccessorProperty(QStringLiteral("$6"), method_get_lastMatch_n<6>, 0); ctor->defineAccessorProperty(QStringLiteral("$7"), method_get_lastMatch_n<7>, 0); ctor->defineAccessorProperty(QStringLiteral("$8"), method_get_lastMatch_n<8>, 0); ctor->defineAccessorProperty(QStringLiteral("$9"), method_get_lastMatch_n<9>, 0); ctor->defineAccessorProperty(QStringLiteral("lastParen"), method_get_lastParen, 0); ctor->defineAccessorProperty(QStringLiteral("$+"), method_get_lastParen, 0); ctor->defineAccessorProperty(QStringLiteral("input"), method_get_input, 0); ctor->defineAccessorProperty(QStringLiteral("$_"), method_get_input, 0); ctor->defineAccessorProperty(QStringLiteral("leftContext"), method_get_leftContext, 0); ctor->defineAccessorProperty(QStringLiteral("$`"), method_get_leftContext, 0); ctor->defineAccessorProperty(QStringLiteral("rightContext"), method_get_rightContext, 0); ctor->defineAccessorProperty(QStringLiteral("$'"), method_get_rightContext, 0); defineDefaultProperty(QStringLiteral("constructor"), (o = ctor)); defineDefaultProperty(QStringLiteral("exec"), method_exec, 1); defineDefaultProperty(QStringLiteral("test"), method_test, 1); defineDefaultProperty(engine->id_toString, method_toString, 0); defineDefaultProperty(QStringLiteral("compile"), method_compile, 2); } ReturnedValue RegExpPrototype::method_exec(CallContext *ctx) { Scope scope(ctx); Scoped r(scope, ctx->d()->callData->thisObject.as()); if (!r) return ctx->throwTypeError(); ScopedValue arg(scope, ctx->argument(0)); arg = RuntimeHelpers::toString(ctx, arg); if (scope.hasException()) return Encode::undefined(); QString s = arg->stringValue()->toQString(); int offset = r->global() ? r->lastIndexProperty(ctx)->value.toInt32() : 0; if (offset < 0 || offset > s.length()) { r->lastIndexProperty(ctx)->value = Primitive::fromInt32(0); return Encode::null(); } uint* matchOffsets = (uint*)alloca(r->value()->captureCount() * 2 * sizeof(uint)); const int result = r->value()->match(s, offset, matchOffsets); Scoped regExpCtor(scope, ctx->d()->engine->regExpCtor); regExpCtor->d()->clearLastMatch(); if (result == -1) { r->lastIndexProperty(ctx)->value = Primitive::fromInt32(0); return Encode::null(); } // fill in result data Scoped array(scope, ctx->d()->engine->newArrayObject(ctx->d()->engine->regExpExecArrayClass)); int len = r->value()->captureCount(); array->arrayReserve(len); ScopedValue v(scope); for (int i = 0; i < len; ++i) { int start = matchOffsets[i * 2]; int end = matchOffsets[i * 2 + 1]; v = (start != -1 && end != -1) ? ctx->d()->engine->newString(s.mid(start, end - start))->asReturnedValue() : Encode::undefined(); array->arrayPut(i, v); } array->setArrayLengthUnchecked(len); array->memberData()[Index_ArrayIndex] = Primitive::fromInt32(result); array->memberData()[Index_ArrayInput] = arg.asReturnedValue(); RegExpCtor::Data *dd = regExpCtor->d(); dd->lastMatch = array; dd->lastInput = arg->stringValue(); dd->lastMatchStart = matchOffsets[0]; dd->lastMatchEnd = matchOffsets[1]; if (r->global()) r->lastIndexProperty(ctx)->value = Primitive::fromInt32(matchOffsets[1]); return array.asReturnedValue(); } ReturnedValue RegExpPrototype::method_test(CallContext *ctx) { Scope scope(ctx); ScopedValue r(scope, method_exec(ctx)); return Encode(!r->isNull()); } ReturnedValue RegExpPrototype::method_toString(CallContext *ctx) { Scope scope(ctx); Scoped r(scope, ctx->d()->callData->thisObject.as()); if (!r) return ctx->throwTypeError(); return ctx->d()->engine->newString(r->toString())->asReturnedValue(); } ReturnedValue RegExpPrototype::method_compile(CallContext *ctx) { Scope scope(ctx); Scoped r(scope, ctx->d()->callData->thisObject.as()); if (!r) return ctx->throwTypeError(); ScopedCallData callData(scope, ctx->d()->callData->argc); memcpy(callData->args, ctx->d()->callData->args, ctx->d()->callData->argc*sizeof(Value)); Scoped re(scope, ctx->d()->engine->regExpCtor.asFunctionObject()->construct(callData)); r->d()->value = re->value(); r->d()->global = re->global(); return Encode::undefined(); } template ReturnedValue RegExpPrototype::method_get_lastMatch_n(CallContext *ctx) { Scope scope(ctx); ScopedArrayObject lastMatch(scope, static_cast(ctx->d()->engine->regExpCtor.objectValue())->lastMatch()); ScopedValue result(scope, lastMatch ? lastMatch->getIndexed(index) : Encode::undefined()); if (result->isUndefined()) return ctx->d()->engine->newString(QString())->asReturnedValue(); return result.asReturnedValue(); } ReturnedValue RegExpPrototype::method_get_lastParen(CallContext *ctx) { Scope scope(ctx); ScopedArrayObject lastMatch(scope, static_cast(ctx->d()->engine->regExpCtor.objectValue())->lastMatch()); ScopedValue result(scope, lastMatch ? lastMatch->getIndexed(lastMatch->getLength() - 1) : Encode::undefined()); if (result->isUndefined()) return ctx->d()->engine->newString(QString())->asReturnedValue(); return result.asReturnedValue(); } ReturnedValue RegExpPrototype::method_get_input(CallContext *ctx) { return static_cast(ctx->d()->engine->regExpCtor.objectValue())->lastInput().asReturnedValue(); } ReturnedValue RegExpPrototype::method_get_leftContext(CallContext *ctx) { Scope scope(ctx); Scoped regExpCtor(scope, ctx->d()->engine->regExpCtor); QString lastInput = regExpCtor->lastInput()->toQString(); return ctx->d()->engine->newString(lastInput.left(regExpCtor->lastMatchStart()))->asReturnedValue(); } ReturnedValue RegExpPrototype::method_get_rightContext(CallContext *ctx) { Scope scope(ctx); Scoped regExpCtor(scope, ctx->d()->engine->regExpCtor); QString lastInput = regExpCtor->lastInput()->toQString(); return ctx->d()->engine->newString(lastInput.mid(regExpCtor->lastMatchEnd()))->asReturnedValue(); } QT_END_NAMESPACE