summaryrefslogtreecommitdiffstats
path: root/kjs/regexp_object.cpp
diff options
context:
space:
mode:
authortoma <toma@283d02a7-25f6-0310-bc7c-ecb5cbfe19da>2009-11-25 17:56:58 +0000
committertoma <toma@283d02a7-25f6-0310-bc7c-ecb5cbfe19da>2009-11-25 17:56:58 +0000
commitce4a32fe52ef09d8f5ff1dd22c001110902b60a2 (patch)
tree5ac38a06f3dde268dc7927dc155896926aaf7012 /kjs/regexp_object.cpp
downloadtdelibs-ce4a32fe52ef09d8f5ff1dd22c001110902b60a2.tar.gz
tdelibs-ce4a32fe52ef09d8f5ff1dd22c001110902b60a2.zip
Copy the KDE 3.5 branch to branches/trinity for new KDE 3.5 features.
BUG:215923 git-svn-id: svn://anonsvn.kde.org/home/kde/branches/trinity/kdelibs@1054174 283d02a7-25f6-0310-bc7c-ecb5cbfe19da
Diffstat (limited to 'kjs/regexp_object.cpp')
-rw-r--r--kjs/regexp_object.cpp378
1 files changed, 378 insertions, 0 deletions
diff --git a/kjs/regexp_object.cpp b/kjs/regexp_object.cpp
new file mode 100644
index 000000000..edd2bbeca
--- /dev/null
+++ b/kjs/regexp_object.cpp
@@ -0,0 +1,378 @@
+// -*- c-basic-offset: 2 -*-
+/*
+ * This file is part of the KDE libraries
+ * Copyright (C) 1999-2000 Harri Porten (porten@kde.org)
+ * Copyright (C) 2003 Apple Computer, Inc.
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ *
+ */
+
+#include <stdio.h>
+
+#include "value.h"
+#include "object.h"
+#include "types.h"
+#include "interpreter.h"
+#include "operations.h"
+#include "internal.h"
+#include "regexp.h"
+#include "regexp_object.h"
+#include "error_object.h"
+#include "lookup.h"
+
+using namespace KJS;
+
+// ------------------------------ RegExpPrototypeImp ---------------------------
+
+// ECMA 15.9.4
+
+const ClassInfo RegExpPrototypeImp::info = {"RegExp", 0, 0, 0};
+
+RegExpPrototypeImp::RegExpPrototypeImp(ExecState *exec,
+ ObjectPrototypeImp *objProto,
+ FunctionPrototypeImp *funcProto)
+ : ObjectImp(objProto)
+{
+ Value protect(this);
+ setInternalValue(String(""));
+
+ // The constructor will be added later in RegExpObject's constructor (?)
+
+ static const Identifier execPropertyName("exec");
+ putDirect(execPropertyName,
+ new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Exec, 0, execPropertyName), DontEnum);
+ static const Identifier testPropertyName("test");
+ putDirect(testPropertyName,
+ new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Test, 0, testPropertyName), DontEnum);
+ putDirect(toStringPropertyName,
+ new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::ToString, 0, toStringPropertyName), DontEnum);
+ static const Identifier compilePropertyName("compile");
+ putDirect(compilePropertyName,
+ new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Compile, 1, compilePropertyName), DontEnum);
+}
+
+// ------------------------------ RegExpProtoFuncImp ---------------------------
+
+RegExpProtoFuncImp::RegExpProtoFuncImp(ExecState * /*exec*/, FunctionPrototypeImp *funcProto,
+ int i, int len, const Identifier &_ident)
+ : InternalFunctionImp(funcProto), id(i)
+{
+ Value protect(this);
+ putDirect(lengthPropertyName, len, DontDelete|ReadOnly|DontEnum);
+ ident = _ident;
+}
+
+bool RegExpProtoFuncImp::implementsCall() const
+{
+ return true;
+}
+
+Value RegExpProtoFuncImp::call(ExecState *exec, Object &thisObj, const List &args)
+{
+ if (!thisObj.inherits(&RegExpImp::info)) {
+ if (thisObj.inherits(&RegExpPrototypeImp::info)) {
+ switch (id) {
+ case ToString: return String("//"); // FireFox returns /(?:)/
+ }
+ }
+ Object err = Error::create(exec,TypeError);
+ exec->setException(err);
+ return err;
+ }
+
+ RegExpImp *reimp = static_cast<RegExpImp*>(thisObj.imp());
+ RegExp *re = reimp->regExp();
+ String s;
+ UString str;
+ switch (id) {
+ case Exec: // 15.10.6.2
+ case Test:
+ {
+ s = args[0].toString(exec);
+ int length = s.value().size();
+
+ // Get values from the last time (in case of /g)
+ Value lastIndex = thisObj.get(exec,"lastIndex");
+ int i = lastIndex.isValid() ? lastIndex.toInt32(exec) : 0;
+ bool globalFlag = thisObj.get(exec,"global").toBoolean(exec);
+ if (!globalFlag)
+ i = 0;
+ if (i < 0 || i > length) {
+ thisObj.put(exec,"lastIndex", Number(0), DontDelete | DontEnum);
+ if (id == Test)
+ return Boolean(false);
+ else
+ return Null();
+ }
+ RegExpObjectImp* regExpObj = static_cast<RegExpObjectImp*>(exec->lexicalInterpreter()->builtinRegExp().imp());
+ int **ovector = regExpObj->registerRegexp( re, s.value() );
+
+ re->prepareMatch(s.value());
+ str = re->match(s.value(), i, 0L, ovector);
+ re->doneMatch();
+ regExpObj->setSubPatterns(re->subPatterns());
+
+ if (id == Test)
+ return Boolean(!str.isNull());
+
+ if (str.isNull()) // no match
+ {
+ if (globalFlag)
+ thisObj.put(exec,"lastIndex",Number(0), DontDelete | DontEnum);
+ return Null();
+ }
+ else // success
+ {
+ if (globalFlag)
+ thisObj.put(exec,"lastIndex",Number( (*ovector)[1] ), DontDelete | DontEnum);
+ return regExpObj->arrayOfMatches(exec,str);
+ }
+ }
+ break;
+ case ToString:
+ s = thisObj.get(exec,"source").toString(exec);
+ str = "/";
+ str += s.value();
+ str += "/";
+ if (thisObj.get(exec,"global").toBoolean(exec)) {
+ str += "g";
+ }
+ if (thisObj.get(exec,"ignoreCase").toBoolean(exec)) {
+ str += "i";
+ }
+ if (thisObj.get(exec,"multiline").toBoolean(exec)) {
+ str += "m";
+ }
+ return String(str);
+ case Compile: {
+ RegExp* newEngine = RegExpObjectImp::makeEngine(exec, args[0].toString(exec), args[1]);
+ if (!newEngine)
+ return exec->exception();
+ reimp->setRegExp(newEngine);
+ return Value(reimp);
+ }
+ }
+
+
+ return Undefined();
+}
+
+// ------------------------------ RegExpImp ------------------------------------
+
+const ClassInfo RegExpImp::info = {"RegExp", 0, 0, 0};
+
+RegExpImp::RegExpImp(RegExpPrototypeImp *regexpProto)
+ : ObjectImp(regexpProto), reg(0L)
+{
+}
+
+RegExpImp::~RegExpImp()
+{
+ delete reg;
+}
+
+void RegExpImp::setRegExp(RegExp *r)
+{
+ delete reg;
+ reg = r;
+
+ Object protect(this);//Protect self from GC (we are allocating a StringImp, and may be new)
+ putDirect("global", (r->flags() & RegExp::Global) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
+ DontDelete | ReadOnly | DontEnum);
+ putDirect("ignoreCase", (r->flags() & RegExp::IgnoreCase) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
+ DontDelete | ReadOnly | DontEnum);
+ putDirect("multiline", (r->flags() & RegExp::Multiline) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
+ DontDelete | ReadOnly | DontEnum);
+
+ putDirect("source", new StringImp(r->pattern()), DontDelete | ReadOnly | DontEnum);
+ putDirect("lastIndex", NumberImp::zero(), DontDelete | DontEnum);
+}
+
+// ------------------------------ RegExpObjectImp ------------------------------
+
+RegExpObjectImp::RegExpObjectImp(ExecState * /*exec*/,
+ FunctionPrototypeImp *funcProto,
+ RegExpPrototypeImp *regProto)
+
+ : InternalFunctionImp(funcProto), lastOvector(0L), lastNrSubPatterns(0)
+{
+ Value protect(this);
+ // ECMA 15.10.5.1 RegExp.prototype
+ putDirect(prototypePropertyName, regProto, DontEnum|DontDelete|ReadOnly);
+
+ // no. of arguments for constructor
+ putDirect(lengthPropertyName, NumberImp::two(), ReadOnly|DontDelete|DontEnum);
+}
+
+RegExpObjectImp::~RegExpObjectImp()
+{
+ delete [] lastOvector;
+}
+
+int **RegExpObjectImp::registerRegexp( const RegExp* re, const UString& s )
+{
+ lastString = s;
+ delete [] lastOvector;
+ lastOvector = 0;
+ lastNrSubPatterns = re->subPatterns();
+ return &lastOvector;
+}
+
+Object RegExpObjectImp::arrayOfMatches(ExecState *exec, const UString &result) const
+{
+ List list;
+ // The returned array contains 'result' as first item, followed by the list of matches
+ list.append(String(result));
+ if ( lastOvector )
+ for ( unsigned int i = 1 ; i < lastNrSubPatterns + 1 ; ++i )
+ {
+ UString substring = lastString.substr( lastOvector[2*i], lastOvector[2*i+1] - lastOvector[2*i] );
+ list.append(String(substring));
+ }
+ Object arr = exec->lexicalInterpreter()->builtinArray().construct(exec, list);
+ arr.put(exec, "index", Number(lastOvector[0]));
+ arr.put(exec, "input", String(lastString));
+ return arr;
+}
+
+Value RegExpObjectImp::get(ExecState *exec, const Identifier &p) const
+{
+ UString s = p.ustring();
+ if (s[0] == '$' && lastOvector)
+ {
+ bool ok;
+ unsigned long i = s.substr(1).toULong(&ok);
+ if (ok)
+ {
+ if (i < lastNrSubPatterns + 1)
+ {
+ UString substring = lastString.substr( lastOvector[2*i], lastOvector[2*i+1] - lastOvector[2*i] );
+ return String(substring);
+ }
+ return String("");
+ }
+ }
+ return InternalFunctionImp::get(exec, p);
+}
+
+bool RegExpObjectImp::hasProperty(ExecState *exec, const Identifier &p) const
+{
+ UString s = p.ustring();
+ if (s[0] == '$' && lastOvector) {
+ bool ok;
+ (void)s.substr(1).toULong(&ok);
+ if (ok)
+ return true;
+ }
+
+ return InternalFunctionImp::hasProperty(exec, p);
+}
+
+bool RegExpObjectImp::implementsConstruct() const
+{
+ return true;
+}
+
+RegExp* RegExpObjectImp::makeEngine(ExecState *exec, const UString &p, const Value &flagsInput)
+{
+ UString flags = flagsInput.type() == UndefinedType ? UString("") : flagsInput.toString(exec);
+
+ // Check for validity of flags
+ for (int pos = 0; pos < flags.size(); ++pos) {
+ switch (flags[pos].unicode()) {
+ case 'g':
+ case 'i':
+ case 'm':
+ break;
+ default: {
+ Object err = Error::create(exec, SyntaxError,
+ "Invalid regular expression flags");
+ exec->setException(err);
+ return 0;
+ }
+ }
+ }
+
+ bool global = (flags.find("g") >= 0);
+ bool ignoreCase = (flags.find("i") >= 0);
+ bool multiline = (flags.find("m") >= 0);
+
+ int reflags = RegExp::None;
+ if (global)
+ reflags |= RegExp::Global;
+ if (ignoreCase)
+ reflags |= RegExp::IgnoreCase;
+ if (multiline)
+ reflags |= RegExp::Multiline;
+
+ RegExp *re = new RegExp(p, reflags);
+ if (!re->isValid()) {
+ Object err = Error::create(exec, SyntaxError,
+ "Invalid regular expression");
+ exec->setException(err);
+ delete re;
+ return 0;
+ }
+ return re;
+}
+
+// ECMA 15.10.4
+Object RegExpObjectImp::construct(ExecState *exec, const List &args)
+{
+ UString p;
+ if (args.isEmpty()) {
+ p = "";
+ } else {
+ Value a0 = args[0];
+ if (a0.isA(ObjectType) && a0.toObject(exec).inherits(&RegExpImp::info)) {
+ // It's a regexp. Check that no flags were passed.
+ if (args.size() > 1 && args[1].type() != UndefinedType) {
+ Object err = Error::create(exec,TypeError);
+ exec->setException(err);
+ return err;
+ }
+ RegExpImp *rimp = static_cast<RegExpImp*>(Object::dynamicCast(a0).imp());
+ p = rimp->regExp()->pattern();
+ } else {
+ p = a0.toString(exec);
+ }
+ }
+
+ RegExp* re = makeEngine(exec, p, args[1]);
+ if (!re)
+ return exec->exception().toObject(exec);
+
+ RegExpPrototypeImp *proto = static_cast<RegExpPrototypeImp*>(exec->lexicalInterpreter()->builtinRegExpPrototype().imp());
+ RegExpImp *dat = new RegExpImp(proto);
+ Object obj(dat); // protect from GC
+ dat->setRegExp(re);
+
+ return obj;
+}
+
+bool RegExpObjectImp::implementsCall() const
+{
+ return true;
+}
+
+// ECMA 15.10.3
+Value RegExpObjectImp::call(ExecState *exec, Object &/*thisObj*/,
+ const List &args)
+{
+ // TODO: handle RegExp argument case (15.10.3.1)
+
+ return construct(exec, args);
+}