/****************************************************************************
**
** Copyright (C) 2013 Digia Plc and/or its subsidiary(-ies).
** Contact: http://www.qt-project.org/legal
**
** This file is part of the QtQml module of the Qt Toolkit.
**
** $QT_BEGIN_LICENSE:LGPL$
** Commercial License Usage
** Licensees holding valid commercial Qt licenses may use this file in
** accordance with the commercial license agreement provided with the
** Software or, alternatively, in accordance with the terms contained in
** a written agreement between you and Digia. For licensing terms and
** conditions see http://qt.digia.com/licensing. For further information
** use the contact form at http://qt.digia.com/contact-us.
**
** GNU Lesser General Public License Usage
** Alternatively, this file may be used under the terms of the GNU Lesser
** General Public License version 2.1 as published by the Free Software
** Foundation and appearing in the file LICENSE.LGPL included in the
** packaging of this file. Please review the following information to
** ensure the GNU Lesser General Public License version 2.1 requirements
** will be met: http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
**
** In addition, as a special exception, Digia gives you certain additional
** rights. These rights are described in the Digia Qt LGPL Exception
** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
**
** GNU General Public License Usage
** Alternatively, this file may be used under the terms of the GNU
** General Public License version 3.0 as published by the Free Software
** Foundation and appearing in the file LICENSE.GPL included in the
** packaging of this file. Please review the following information to
** ensure the GNU General Public License version 3.0 requirements will be
** met: http://www.gnu.org/copyleft/gpl.html.
**
**
** $QT_END_LICENSE$
**
****************************************************************************/

#include "qv4regexpobject_p.h"
#include "qv4jsir_p.h"
#include "qv4isel_p.h"
#include "qv4objectproto_p.h"
#include "qv4stringobject_p.h"
#include "qv4mm_p.h"
#include "qv4scopedvalue_p.h"

// NOTE(review): the targets of the angle-bracket includes in this file were
// missing from the reviewed copy and have been restored to the set commonly
// used by the V4 sources -- confirm against the build.
#include <private/qqmljsengine_p.h>
#include <private/qqmljslexer_p.h>
#include <private/qqmljsparser_p.h>
#include <private/qqmljsast_p.h>
#include <qv4jsir_p.h>
#include <qv4codegen_p.h>
#include "private/qlocale_tools_p.h"

#include <QtCore/qmath.h>
#include <QtCore/QDebug>
#include <QtCore/qregexp.h>
#include <cassert>
#include <typeinfo>
#include <iostream>
#include "qv4alloca_p.h"

QT_BEGIN_NAMESPACE

// Declared here, defined elsewhere; used below to normalise a QRegExp pattern
// before it is handed to the JS regular expression engine.
Q_CORE_EXPORT QString qt_regexp_toCanonical(const QString &, QRegExp::PatternSyntax);

using namespace QV4;

DEFINE_OBJECT_VTABLE(RegExpObject);

// Creates a RegExpObject for the given internal class, backed by an empty,
// case-sensitive, single-line, non-global pattern.
RegExpObject::RegExpObject(InternalClass *ic)
    : Object(ic)
{
    d()->value = RegExp::create(ic->engine, QString(), false, false);
    d()->global = false;
    Q_ASSERT(internalClass()->vtable == staticVTable());
    init(ic->engine);
}

// Wraps an already compiled RegExp. `global` becomes the object's "global" flag.
RegExpObject::RegExpObject(ExecutionEngine *engine, RegExpRef value, bool global)
    : Object(engine->regExpClass)
{
    d()->value = value;
    d()->global = global;
    init(engine);
}

// Converts a QRegExp to a JS RegExp.
// The conversion is not 100% exact since ECMA regexp and QRegExp
// have different semantics/flags, but we try to do our best.
RegExpObject::RegExpObject(ExecutionEngine *engine, const QRegExp &re)
    : Object(engine->regExpClass)
{
    d()->value = 0;
    d()->global = false;

    // Convert the pattern to a ECMAScript pattern.
    QString pattern = QT_PREPEND_NAMESPACE(qt_regexp_toCanonical)(re.pattern(), re.patternSyntax());
    if (re.isMinimal()) {
        // QRegExp's "minimal" mode is emulated by appending '?' to every
        // quantifier ('?', '+', '*' and a closing '}') found outside a
        // bracket expression.
        QString ecmaPattern;
        int len = pattern.length();
        ecmaPattern.reserve(len);
        int i = 0;
        const QChar *wc = pattern.unicode();
        bool inBracket = false;
        while (i < len) {
            QChar c = wc[i++];
            ecmaPattern += c;
            switch (c.unicode()) {
            case '?':
            case '+':
            case '*':
            case '}':
                if (!inBracket)
                    ecmaPattern += QLatin1Char('?');
                break;
            case '\\':
                // Copy the escaped character verbatim so that it is never
                // interpreted as a quantifier or bracket.
                if (i < len)
                    ecmaPattern += wc[i++];
                break;
            case '[':
                inBracket = true;
                break;
            case ']':
                inBracket = false;
                break;
            default:
                break;
            }
        }
        pattern = ecmaPattern;
    }

    // Hold a scoped reference to this object while the RegExp is created
    // (presumably to keep it reachable for the memory manager -- confirm).
    Scope scope(engine);
    ScopedObject protectThis(scope, this);

    d()->value = RegExp::create(engine, pattern, re.caseSensitivity() == Qt::CaseInsensitive, false);

    init(engine);
}

// Shared constructor tail: installs the vtable and defines the "lastIndex",
// "source", "global", "ignoreCase" and "multiline" properties.
void RegExpObject::init(ExecutionEngine *engine)
{
    setVTable(staticVTable());

    Scope scope(engine);
    ScopedObject protectThis(scope, this);

    // "lastIndex" is inserted first; lastIndexProperty() relies on it being
    // the member at index 0.
    ScopedString lastIndex(scope, engine->newIdentifier(QStringLiteral("lastIndex")));
    ScopedValue v(scope, Primitive::fromInt32(0));
    insertMember(lastIndex.getPointer(), v, Attr_NotEnumerable|Attr_NotConfigurable);
    if (!this->value())
        return;

    QString p = this->value()->pattern();
    if (p.isEmpty()) {
        p = QStringLiteral("(?:)");
    } else {
        // escape certain parts, see ch. 15.10.4
        p.replace('/', QLatin1String("\\/"));
    }

    defineReadonlyProperty(QStringLiteral("source"), (v = engine->newString(p)));
    defineReadonlyProperty(QStringLiteral("global"), Primitive::fromBoolean(global()));
    defineReadonlyProperty(QStringLiteral("ignoreCase"), Primitive::fromBoolean(this->value()->ignoreCase()));
    defineReadonlyProperty(QStringLiteral("multiline"), Primitive::fromBoolean(this->value()->multiLine()));
}

// Marks the wrapped RegExp (if any) and then the generic object state.
void RegExpObject::markObjects(Managed *that, ExecutionEngine *e)
{
    RegExpObject *re = static_cast<RegExpObject *>(that);
    if (re->value())
        re->value()->mark(e);
    Object::markObjects(that, e);
}

// Returns the property slot holding "lastIndex". init() inserts it as the
// first member, so it is property 0; the assertion checks that in debug builds.
Property *RegExpObject::lastIndexProperty(ExecutionContext *ctx)
{
    Q_UNUSED(ctx);
    Q_ASSERT(0 == internalClass()->find(ctx->d()->engine->newIdentifier(QStringLiteral("lastIndex"))));
    return propertyAt(0);
}

// Converts a JS RegExp to a QRegExp.
// The conversion is not 100% exact since ECMA regexp and QRegExp
// have different semantics/flags, but we try to do our best.
QRegExp RegExpObject::toQRegExp() const
{
    Qt::CaseSensitivity caseSensitivity = value()->ignoreCase() ? Qt::CaseInsensitive : Qt::CaseSensitive;
    return QRegExp(value()->pattern(), caseSensitivity, QRegExp::RegExp2);
}

// Builds the literal form "/source/flags", appending 'g', 'i' and 'm' in that
// order for the flags that are set.
QString RegExpObject::toString() const
{
    QString result = QLatin1Char('/') + source();
    result += QLatin1Char('/');
    if (global())
        result += QLatin1Char('g');
    if (value()->ignoreCase())
        result += QLatin1Char('i');
    if (value()->multiLine())
        result += QLatin1Char('m');
    return result;
}

// Returns the value of the object's "source" property as a QString.
QString RegExpObject::source() const
{
    Scope scope(engine());
    ScopedString source(scope, scope.engine->newIdentifier(QStringLiteral("source")));
    // get() is non-const, hence the const_cast.
    ScopedValue s(scope, const_cast<RegExpObject *>(this)->get(source.getPointer()));
    return s->toQString();
}

// Returns the flags of this object as a bitwise OR of RegExp_Global,
// RegExp_IgnoreCase and RegExp_Multiline.
uint RegExpObject::flags() const
{
    uint f = 0;
    if (global())
        f |= QV4::RegExpObject::RegExp_Global;
    if (value()->ignoreCase())
        f |= QV4::RegExpObject::RegExp_IgnoreCase;
    if (value()->multiLine())
        f |= QV4::RegExpObject::RegExp_Multiline;
    return f;
}

DEFINE_OBJECT_VTABLE(RegExpCtor);

// Creates the "RegExp" constructor function with no recorded last match.
RegExpCtor::RegExpCtor(ExecutionContext *scope)
    : FunctionObject(scope, QStringLiteral("RegExp"))
{
    setVTable(staticVTable());
    clearLastMatch();
}

// Resets the last-match state that backs the legacy RegExp.$1, lastMatch,
// input, leftContext, ... accessors.
void RegExpCtor::clearLastMatch()
{
    d()->lastMatch = Primitive::nullValue();
    d()->lastInput = engine()->id_empty;
    d()->lastMatchStart = 0;
    d()->lastMatchEnd = 0;
}

// Implements `new RegExp(pattern, flags)`.
//
// If `pattern` is already a RegExpObject it is cloned; supplying flags in that
// case throws a TypeError. Otherwise pattern and flags are converted to
// strings. Unknown or repeated flag characters and invalid patterns throw a
// SyntaxError.
ReturnedValue RegExpCtor::construct(Managed *m, CallData *callData)
{
    ExecutionContext *ctx = m->engine()->currentContext();
    Scope scope(ctx);

    ScopedValue r(scope, callData->argument(0));
    ScopedValue f(scope, callData->argument(1));
    Scoped<RegExpObject> re(scope, r);
    if (re) {
        if (!f->isUndefined())
            return ctx->throwTypeError();

        Scoped<RegExp> newRe(scope, re->value());
        return Encode(ctx->d()->engine->newRegExpObject(newRe, re->global()));
    }

    QString pattern;
    if (!r->isUndefined())
        pattern = r->toString(ctx)->toQString();
    if (scope.hasException())
        return Encode::undefined();

    bool global = false;
    bool ignoreCase = false;
    bool multiLine = false;
    if (!f->isUndefined()) {
        f = RuntimeHelpers::toString(ctx, f);
        if (scope.hasException())
            return Encode::undefined();
        QString str = f->stringValue()->toQString();
        // Each of 'g', 'i' and 'm' may appear at most once; anything else
        // (including a repeated flag) is a syntax error.
        for (int i = 0; i < str.length(); ++i) {
            if (str.at(i) == QLatin1Char('g') && !global) {
                global = true;
            } else if (str.at(i) == QLatin1Char('i') && !ignoreCase) {
                ignoreCase = true;
            } else if (str.at(i) == QLatin1Char('m') && !multiLine) {
                multiLine = true;
            } else {
                return ctx->throwSyntaxError(QStringLiteral("Invalid flags supplied to RegExp constructor"));
            }
        }
    }

    Scoped<RegExp> regexp(scope, RegExp::create(ctx->d()->engine, pattern, ignoreCase, multiLine));
    if (!regexp->isValid())
        return ctx->throwSyntaxError(QStringLiteral("Invalid regular expression"));

    return Encode(ctx->d()->engine->newRegExpObject(regexp, global));
}

// Implements `RegExp(pattern, flags)` called as a plain function: a
// RegExpObject passed without flags is returned unchanged, everything else is
// forwarded to construct().
ReturnedValue RegExpCtor::call(Managed *that, CallData *callData)
{
    if (callData->argc > 0 && callData->args[0].as<RegExpObject>()) {
        if (callData->argc == 1 || callData->args[1].isUndefined())
            return callData->args[0].asReturnedValue();
    }

    return construct(that, callData);
}

// Marks the recorded last match and last input, then the function object state.
void RegExpCtor::markObjects(Managed *that, ExecutionEngine *e)
{
    RegExpCtor *This = static_cast<RegExpCtor *>(that);
    This->lastMatch().mark(e);
    This->lastInput().mark(e);
    FunctionObject::markObjects(that, e);
}

// Populates the RegExp constructor `ctor` and this prototype object with their
// properties and methods.
void RegExpPrototype::init(ExecutionEngine *engine, ObjectRef ctor)
{
    Scope scope(engine);
    ScopedObject o(scope);

    ctor->defineReadonlyProperty(engine->id_prototype, (o = this));
    ctor->defineReadonlyProperty(engine->id_length, Primitive::fromInt32(2));

    // Properties deprecated in the spec but required by "the web" :(
    ctor->defineAccessorProperty(QStringLiteral("lastMatch"), method_get_lastMatch_n<0>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$&"), method_get_lastMatch_n<0>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$1"), method_get_lastMatch_n<1>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$2"), method_get_lastMatch_n<2>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$3"), method_get_lastMatch_n<3>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$4"), method_get_lastMatch_n<4>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$5"), method_get_lastMatch_n<5>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$6"), method_get_lastMatch_n<6>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$7"), method_get_lastMatch_n<7>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$8"), method_get_lastMatch_n<8>, 0);
    ctor->defineAccessorProperty(QStringLiteral("$9"), method_get_lastMatch_n<9>, 0);
    ctor->defineAccessorProperty(QStringLiteral("lastParen"), method_get_lastParen, 0);
    ctor->defineAccessorProperty(QStringLiteral("$+"), method_get_lastParen, 0);
    ctor->defineAccessorProperty(QStringLiteral("input"), method_get_input, 0);
    ctor->defineAccessorProperty(QStringLiteral("$_"), method_get_input, 0);
    ctor->defineAccessorProperty(QStringLiteral("leftContext"), method_get_leftContext, 0);
    ctor->defineAccessorProperty(QStringLiteral("$`"), method_get_leftContext, 0);
    ctor->defineAccessorProperty(QStringLiteral("rightContext"), method_get_rightContext, 0);
    ctor->defineAccessorProperty(QStringLiteral("$'"), method_get_rightContext, 0);

    defineDefaultProperty(QStringLiteral("constructor"), (o = ctor));
    defineDefaultProperty(QStringLiteral("exec"), method_exec, 1);
    defineDefaultProperty(QStringLiteral("test"), method_test, 1);
    defineDefaultProperty(engine->id_toString, method_toString, 0);
    defineDefaultProperty(QStringLiteral("compile"), method_compile, 2);
}

// Implements RegExp.prototype.exec(string).
//
// Throws a TypeError if `this` is not a RegExpObject. Returns null when there
// is no match (and resets lastIndex to 0); otherwise returns an array of the
// captured substrings with the match index and input string stored in its
// member data, and records the match on the RegExp constructor.
ReturnedValue RegExpPrototype::method_exec(CallContext *ctx)
{
    Scope scope(ctx);

    Scoped<RegExpObject> r(scope, ctx->d()->callData->thisObject.as<RegExpObject>());
    if (!r)
        return ctx->throwTypeError();

    ScopedValue arg(scope, ctx->argument(0));
    arg = RuntimeHelpers::toString(ctx, arg);
    if (scope.hasException())
        return Encode::undefined();
    QString s = arg->stringValue()->toQString();

    // Only global regexps resume from lastIndex; all others start at 0.
    int offset = r->global() ? r->lastIndexProperty(ctx)->value.toInt32() : 0;
    if (offset < 0 || offset > s.length()) {
        r->lastIndexProperty(ctx)->value = Primitive::fromInt32(0);
        return Encode::null();
    }

    // Two offsets (start, end) per capture.
    uint* matchOffsets = (uint*)alloca(r->value()->captureCount() * 2 * sizeof(uint));
    const int result = r->value()->match(s, offset, matchOffsets);

    Scoped<RegExpCtor> regExpCtor(scope, ctx->d()->engine->regExpCtor);
    regExpCtor->clearLastMatch();

    if (result == -1) {
        r->lastIndexProperty(ctx)->value = Primitive::fromInt32(0);
        return Encode::null();
    }

    // fill in result data
    Scoped<ArrayObject> array(scope, ctx->d()->engine->newArrayObject(ctx->d()->engine->regExpExecArrayClass));
    int len = r->value()->captureCount();
    array->arrayReserve(len);
    ScopedValue v(scope);
    for (int i = 0; i < len; ++i) {
        // An offset of -1 denotes a capture that did not take part in the match.
        int start = matchOffsets[i * 2];
        int end = matchOffsets[i * 2 + 1];
        v = (start != -1 && end != -1) ? ctx->d()->engine->newString(s.mid(start, end - start))->asReturnedValue() : Encode::undefined();
        array->arrayPut(i, v);
    }
    array->setArrayLengthUnchecked(len);
    array->memberData()[Index_ArrayIndex] = Primitive::fromInt32(result);
    array->memberData()[Index_ArrayInput] = arg.asReturnedValue();

    // Remember the match for the legacy RegExp.$n / lastMatch / ... accessors.
    RegExpCtor::Data *dd = regExpCtor->d();
    dd->lastMatch = array;
    dd->lastInput = arg->stringValue();
    dd->lastMatchStart = matchOffsets[0];
    dd->lastMatchEnd = matchOffsets[1];

    if (r->global())
        r->lastIndexProperty(ctx)->value = Primitive::fromInt32(matchOffsets[1]);

    return array.asReturnedValue();
}

// Implements RegExp.prototype.test(string): true unless exec() returned null.
ReturnedValue RegExpPrototype::method_test(CallContext *ctx)
{
    Scope scope(ctx);
    ScopedValue r(scope, method_exec(ctx));
    return Encode(!r->isNull());
}

// Implements RegExp.prototype.toString(); throws a TypeError if `this` is not
// a RegExpObject.
ReturnedValue RegExpPrototype::method_toString(CallContext *ctx)
{
    Scope scope(ctx);
    Scoped<RegExpObject> r(scope, ctx->d()->callData->thisObject.as<RegExpObject>());
    if (!r)
        return ctx->throwTypeError();

    return ctx->d()->engine->newString(r->toString())->asReturnedValue();
}

// Implements RegExp.prototype.compile(pattern, flags): builds a new regexp
// from the arguments via the RegExp constructor and copies its compiled value
// and global flag into `this`. Throws a TypeError if `this` is not a
// RegExpObject.
ReturnedValue RegExpPrototype::method_compile(CallContext *ctx)
{
    Scope scope(ctx);
    Scoped<RegExpObject> r(scope, ctx->d()->callData->thisObject.as<RegExpObject>());
    if (!r)
        return ctx->throwTypeError();

    ScopedCallData callData(scope, ctx->d()->callData->argc);
    memcpy(callData->args, ctx->d()->callData->args, ctx->d()->callData->argc*sizeof(Value));

    Scoped<RegExpObject> re(scope, ctx->d()->engine->regExpCtor.asFunctionObject()->construct(callData));
    // The constructor reports invalid patterns/flags by throwing, in which
    // case there is no RegExpObject to copy from. Leave `this` untouched and
    // let the pending exception propagate instead of dereferencing null.
    if (scope.hasException() || !re)
        return Encode::undefined();

    r->d()->value = re->value();
    r->d()->global = re->global();
    return Encode::undefined();
}

// Getter for RegExp.lastMatch / RegExp.$& (index 0) and RegExp.$1..$9:
// returns entry `index` of the last match array, or an empty string when
// there is no such entry.
template <int index>
ReturnedValue RegExpPrototype::method_get_lastMatch_n(CallContext *ctx)
{
    Scope scope(ctx);
    ScopedArrayObject lastMatch(scope, static_cast<RegExpCtor *>(ctx->d()->engine->regExpCtor.objectValue())->lastMatch());
    ScopedValue result(scope, lastMatch ? lastMatch->getIndexed(index) : Encode::undefined());
    if (result->isUndefined())
        return ctx->d()->engine->newString(QString())->asReturnedValue();
    return result.asReturnedValue();
}

// Getter for RegExp.lastParen / RegExp.$+: returns the last entry of the last
// match array, or an empty string when it is undefined or there is no match.
ReturnedValue RegExpPrototype::method_get_lastParen(CallContext *ctx)
{
    Scope scope(ctx);
    ScopedArrayObject lastMatch(scope, static_cast<RegExpCtor *>(ctx->d()->engine->regExpCtor.objectValue())->lastMatch());
    ScopedValue result(scope, lastMatch ? lastMatch->getIndexed(lastMatch->getLength() - 1) : Encode::undefined());
    if (result->isUndefined())
        return ctx->d()->engine->newString(QString())->asReturnedValue();
    return result.asReturnedValue();
}

// Getter for RegExp.input / RegExp.$_: returns the recorded last input string.
ReturnedValue RegExpPrototype::method_get_input(CallContext *ctx)
{
    return static_cast<RegExpCtor *>(ctx->d()->engine->regExpCtor.objectValue())->lastInput().asReturnedValue();
}

// Getter for RegExp.leftContext / RegExp.$`: the part of the last input that
// precedes the recorded match start.
ReturnedValue RegExpPrototype::method_get_leftContext(CallContext *ctx)
{
    Scope scope(ctx);
    Scoped<RegExpCtor> regExpCtor(scope, ctx->d()->engine->regExpCtor);
    QString lastInput = regExpCtor->lastInput()->toQString();
    return ctx->d()->engine->newString(lastInput.left(regExpCtor->lastMatchStart()))->asReturnedValue();
}

// Getter for RegExp.rightContext / RegExp.$': the part of the last input that
// follows the recorded match end.
ReturnedValue RegExpPrototype::method_get_rightContext(CallContext *ctx)
{
    Scope scope(ctx);
    Scoped<RegExpCtor> regExpCtor(scope, ctx->d()->engine->regExpCtor);
    QString lastInput = regExpCtor->lastInput()->toQString();
    return ctx->d()->engine->newString(lastInput.mid(regExpCtor->lastMatchEnd()))->asReturnedValue();
}

QT_END_NAMESPACE