You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
tdelibs/kjs/regexp_object.cpp

378 lines
11 KiB

/*
* This file is part of the KDE libraries
* Copyright (C) 1999-2000 Harri Porten (porten@kde.org)
* Copyright (C) 2003 Apple Computer, Inc.
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*
*/
#include <stdio.h>
#include "value.h"
#include "object.h"
#include "types.h"
#include "interpreter.h"
#include "operations.h"
#include "internal.h"
#include "regexp.h"
#include "regexp_object.h"
#include "error_object.h"
#include "lookup.h"
using namespace KJS;
// ------------------------------ RegExpPrototypeImp ---------------------------
// ECMA 15.9.4
const ClassInfo RegExpPrototypeImp::info = {"RegExp", 0, 0, 0};
RegExpPrototypeImp::RegExpPrototypeImp(ExecState *exec,
ObjectPrototypeImp *objProto,
FunctionPrototypeImp *funcProto)
: ObjectImp(objProto)
{
Value protect(this);
setInternalValue(String(""));
// The constructor will be added later in RegExpObject's constructor (?)
static const Identifier execPropertyName("exec");
putDirect(execPropertyName,
new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Exec, 0, execPropertyName), DontEnum);
static const Identifier testPropertyName("test");
putDirect(testPropertyName,
new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Test, 0, testPropertyName), DontEnum);
putDirect(toStringPropertyName,
new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::ToString, 0, toStringPropertyName), DontEnum);
static const Identifier compilePropertyName("compile");
putDirect(compilePropertyName,
new RegExpProtoFuncImp(exec,funcProto,RegExpProtoFuncImp::Compile, 1, compilePropertyName), DontEnum);
}
// ------------------------------ RegExpProtoFuncImp ---------------------------
RegExpProtoFuncImp::RegExpProtoFuncImp(ExecState * /*exec*/, FunctionPrototypeImp *funcProto,
int i, int len, const Identifier &_ident)
: InternalFunctionImp(funcProto), id(i)
{
Value protect(this);
putDirect(lengthPropertyName, len, DontDelete|ReadOnly|DontEnum);
ident = _ident;
}
bool RegExpProtoFuncImp::implementsCall() const
{
return true;
}
Value RegExpProtoFuncImp::call(ExecState *exec, Object &thisObj, const List &args)
{
if (!thisObj.inherits(&RegExpImp::info)) {
if (thisObj.inherits(&RegExpPrototypeImp::info)) {
switch (id) {
case ToString: return String("//"); // FireFox returns /(?:)/
}
}
Object err = Error::create(exec,TypeError);
exec->setException(err);
return err;
}
RegExpImp *reimp = static_cast<RegExpImp*>(thisObj.imp());
RegExp *re = reimp->regExp();
String s;
UString str;
switch (id) {
case Exec: // 15.10.6.2
case Test:
{
s = args[0].toString(exec);
int length = s.value().size();
// Get values from the last time (in case of /g)
Value lastIndex = thisObj.get(exec,"lastIndex");
int i = lastIndex.isValid() ? lastIndex.toInt32(exec) : 0;
bool globalFlag = thisObj.get(exec,"global").toBoolean(exec);
if (!globalFlag)
i = 0;
if (i < 0 || i > length) {
thisObj.put(exec,"lastIndex", Number(0), DontDelete | DontEnum);
if (id == Test)
return Boolean(false);
else
return Null();
}
RegExpObjectImp* regExpObj = static_cast<RegExpObjectImp*>(exec->lexicalInterpreter()->builtinRegExp().imp());
int **ovector = regExpObj->registerRegexp( re, s.value() );
re->prepareMatch(s.value());
str = re->match(s.value(), i, 0L, ovector);
re->doneMatch();
regExpObj->setSubPatterns(re->subPatterns());
if (id == Test)
return Boolean(!str.isNull());
if (str.isNull()) // no match
{
if (globalFlag)
thisObj.put(exec,"lastIndex",Number(0), DontDelete | DontEnum);
return Null();
}
else // success
{
if (globalFlag)
thisObj.put(exec,"lastIndex",Number( (*ovector)[1] ), DontDelete | DontEnum);
return regExpObj->arrayOfMatches(exec,str);
}
}
break;
case ToString:
s = thisObj.get(exec,"source").toString(exec);
str = "/";
str += s.value();
str += "/";
if (thisObj.get(exec,"global").toBoolean(exec)) {
str += "g";
}
if (thisObj.get(exec,"ignoreCase").toBoolean(exec)) {
str += "i";
}
if (thisObj.get(exec,"multiline").toBoolean(exec)) {
str += "m";
}
return String(str);
case Compile: {
RegExp* newEngine = RegExpObjectImp::makeEngine(exec, args[0].toString(exec), args[1]);
if (!newEngine)
return exec->exception();
reimp->setRegExp(newEngine);
return Value(reimp);
}
}
return Undefined();
}
// ------------------------------ RegExpImp ------------------------------------
const ClassInfo RegExpImp::info = {"RegExp", 0, 0, 0};
RegExpImp::RegExpImp(RegExpPrototypeImp *regexpProto)
: ObjectImp(regexpProto), reg(0L)
{
}
RegExpImp::~RegExpImp()
{
delete reg;
}
void RegExpImp::setRegExp(RegExp *r)
{
delete reg;
reg = r;
Object protect(this);//Protect self from GC (we are allocating a StringImp, and may be new)
putDirect("global", (r->flags() & RegExp::Global) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
DontDelete | ReadOnly | DontEnum);
putDirect("ignoreCase", (r->flags() & RegExp::IgnoreCase) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
DontDelete | ReadOnly | DontEnum);
putDirect("multiline", (r->flags() & RegExp::Multiline) ? BooleanImp::staticTrue : BooleanImp::staticFalse,
DontDelete | ReadOnly | DontEnum);
putDirect("source", new StringImp(r->pattern()), DontDelete | ReadOnly | DontEnum);
putDirect("lastIndex", NumberImp::zero(), DontDelete | DontEnum);
}
// ------------------------------ RegExpObjectImp ------------------------------
RegExpObjectImp::RegExpObjectImp(ExecState * /*exec*/,
FunctionPrototypeImp *funcProto,
RegExpPrototypeImp *regProto)
: InternalFunctionImp(funcProto), lastOvector(0L), lastNrSubPatterns(0)
{
Value protect(this);
// ECMA 15.10.5.1 RegExp.prototype
putDirect(prototypePropertyName, regProto, DontEnum|DontDelete|ReadOnly);
// no. of arguments for constructor
putDirect(lengthPropertyName, NumberImp::two(), ReadOnly|DontDelete|DontEnum);
}
RegExpObjectImp::~RegExpObjectImp()
{
delete [] lastOvector;
}
int **RegExpObjectImp::registerRegexp( const RegExp* re, const UString& s )
{
lastString = s;
delete [] lastOvector;
lastOvector = 0;
lastNrSubPatterns = re->subPatterns();
return &lastOvector;
}
Object RegExpObjectImp::arrayOfMatches(ExecState *exec, const UString &result) const
{
List list;
// The returned array contains 'result' as first item, followed by the list of matches
list.append(String(result));
if ( lastOvector )
for ( unsigned int i = 1 ; i < lastNrSubPatterns + 1 ; ++i )
{
UString substring = lastString.substr( lastOvector[2*i], lastOvector[2*i+1] - lastOvector[2*i] );
list.append(String(substring));
}
Object arr = exec->lexicalInterpreter()->builtinArray().construct(exec, list);
arr.put(exec, "index", Number(lastOvector[0]));
arr.put(exec, "input", String(lastString));
return arr;
}
Value RegExpObjectImp::get(ExecState *exec, const Identifier &p) const
{
UString s = p.ustring();
if (s[0] == '$' && lastOvector)
{
bool ok;
unsigned long i = s.substr(1).toULong(&ok);
if (ok)
{
if (i < lastNrSubPatterns + 1)
{
UString substring = lastString.substr( lastOvector[2*i], lastOvector[2*i+1] - lastOvector[2*i] );
return String(substring);
}
return String("");
}
}
return InternalFunctionImp::get(exec, p);
}
bool RegExpObjectImp::hasProperty(ExecState *exec, const Identifier &p) const
{
UString s = p.ustring();
if (s[0] == '$' && lastOvector) {
bool ok;
(void)s.substr(1).toULong(&ok);
if (ok)
return true;
}
return InternalFunctionImp::hasProperty(exec, p);
}
bool RegExpObjectImp::implementsConstruct() const
{
return true;
}
RegExp* RegExpObjectImp::makeEngine(ExecState *exec, const UString &p, const Value &flagsInput)
{
UString flags = flagsInput.type() == UndefinedType ? UString("") : flagsInput.toString(exec);
// Check for validity of flags
for (int pos = 0; pos < flags.size(); ++pos) {
switch (flags[pos].unicode()) {
case 'g':
case 'i':
case 'm':
break;
default: {
Object err = Error::create(exec, SyntaxError,
"Invalid regular expression flags");
exec->setException(err);
return 0;
}
}
}
bool global = (flags.find("g") >= 0);
bool ignoreCase = (flags.find("i") >= 0);
bool multiline = (flags.find("m") >= 0);
int reflags = RegExp::None;
if (global)
reflags |= RegExp::Global;
if (ignoreCase)
reflags |= RegExp::IgnoreCase;
if (multiline)
reflags |= RegExp::Multiline;
RegExp *re = new RegExp(p, reflags);
if (!re->isValid()) {
Object err = Error::create(exec, SyntaxError,
"Invalid regular expression");
exec->setException(err);
delete re;
return 0;
}
return re;
}
// ECMA 15.10.4
Object RegExpObjectImp::construct(ExecState *exec, const List &args)
{
UString p;
if (args.isEmpty()) {
p = "";
} else {
Value a0 = args[0];
if (a0.isA(ObjectType) && a0.toObject(exec).inherits(&RegExpImp::info)) {
// It's a regexp. Check that no flags were passed.
if (args.size() > 1 && args[1].type() != UndefinedType) {
Object err = Error::create(exec,TypeError);
exec->setException(err);
return err;
}
RegExpImp *rimp = static_cast<RegExpImp*>(Object::dynamicCast(a0).imp());
p = rimp->regExp()->pattern();
} else {
p = a0.toString(exec);
}
}
RegExp* re = makeEngine(exec, p, args[1]);
if (!re)
return exec->exception().toObject(exec);
RegExpPrototypeImp *proto = static_cast<RegExpPrototypeImp*>(exec->lexicalInterpreter()->builtinRegExpPrototype().imp());
RegExpImp *dat = new RegExpImp(proto);
Object obj(dat); // protect from GC
dat->setRegExp(re);
return obj;
}
bool RegExpObjectImp::implementsCall() const
{
return true;
}
// ECMA 15.10.3
Value RegExpObjectImp::call(ExecState *exec, Object &/*thisObj*/,
const List &args)
{
// TODO: handle RegExp argument case (15.10.3.1)
return construct(exec, args);
}