Files
mongo/db/query.cpp

490 lines
12 KiB
C++
Raw Normal View History

2007-10-19 19:35:48 -04:00
// query.cpp
#include "stdafx.h"
#include "query.h"
#include "pdfile.h"
#include "jsobj.h"
#include "../util/builder.h"
2007-11-04 16:17:44 -05:00
#include <time.h>
2007-11-04 20:47:12 -05:00
#include "introspect.h"
2007-11-10 16:46:30 -05:00
#include "btree.h"
2008-01-20 17:42:26 -05:00
#include "../util/lruishmap.h"
// Experimental LRU-ish map instance. The only reference to it visible in this
// file is a commented-out lookup in updateObjects. Presumably intended as a
// cache along the lines of the original note below -- TODO confirm.
//ns->query->DiskLoc
LRUishMap<JSObj,DiskLoc,5> lrutest(123);
2007-10-19 19:35:48 -04:00
// Cursor id counter, starting at 1. Not read in the portion of the file visible
// here; presumably consumed by the cursor id allocator (allocCursorId) -- TODO confirm.
int nextCursorId = 1;
2007-12-06 19:03:23 -05:00
// Default-constructed object. getIndexCursor hands it to BtreeCursor (instead of
// maxKey) when an order-by index scan is not reversed.
JSObj emptyObj;
2007-11-11 14:21:02 -05:00
/* todo: _ cache query plans
_ use index on partial match with the query
*/
/* Returns true when `re` is a '^'-anchored pattern whose remainder consists only
   of characters accepted as plain text here: space, '0'-'9', '@'-'Z', 'a'-'z'.
   Only such patterns (form /^text/) are served from an index by getIndexCursor.
*/
static bool isIndexablePrefixRegex(const char *re) {
    if( *re != '^' )
        return false;
    for( const char *p = re + 1; *p; ++p ) {
        const char ch = *p;
        const bool plain = ch == ' ' ||
                           (ch >= '0' && ch <= '9') ||
                           (ch >= '@' && ch <= 'Z') ||
                           (ch >= 'a' && ch <= 'z');
        if( !plain )
            return false;
    }
    return true;
}

/* Pick an index-backed cursor for a request on namespace `ns`, if one applies.

   ns    - namespace to look up via nsdetails().
   query - match criteria; its field names are compared with each index key.
   order - requested sort; when non-empty it is considered before `query`.

   Selection rules, in order:
     1. If `order` is non-empty and some index has exactly the same set of key
        field names, return a BtreeCursor over that index. The scan runs in
        reverse (from maxKey, direction -1) when the first order element is a
        negative Number, otherwise forward (from emptyObj, direction 1).
     2. Otherwise, if some index has exactly the same set of key field names as
        `query`, return a BtreeCursor built from the query values. A RegEx value
        is accepted only without flags, in /^text/ form, and as the last element
        of the extracted key; it is replaced by the text after '^'.

   Returns an empty auto_ptr when the namespace is unknown, when no index
   matches, or when a matching index is found but the query contains a regex
   that does not meet the conditions above.
*/
auto_ptr<Cursor> getIndexCursor(const char *ns, JSObj& query, JSObj& order) {
    NamespaceDetails *d = nsdetails(ns);
    if( d == 0 )
        return auto_ptr<Cursor>();

    // order by
    if( !order.isEmpty() ) {
        set<string> orderFields;
        order.getFieldNames(orderFields);
        for( int i = 0; i < d->nIndexes; i++ ) {
            JSObj idxInfo = d->indexes[i].info.obj();
            assert( strcmp(ns, idxInfo.getStringField("ns")) == 0 );
            JSObj idxKey = idxInfo.getObjectField("key");
            set<string> keyFields;
            idxKey.getFieldNames(keyFields);
            if( keyFields != orderFields )
                continue;

            bool reverse =
                order.firstElement().type() == Number &&
                order.firstElement().number() < 0;
            return auto_ptr<Cursor>(new BtreeCursor(d->indexes[i].head, reverse ? maxKey : emptyObj, reverse ? -1 : 1, false));
        }
    }

    // where/query -- the query's field names are only needed from here on
    set<string> queryFields;
    query.getFieldNames(queryFields);
    for( int i = 0; i < d->nIndexes; i++ ) {
        JSObj idxInfo = d->indexes[i].info.obj();
        JSObj idxKey = idxInfo.getObjectField("key");
        set<string> keyFields;
        idxKey.getFieldNames(keyFields);
        if( keyFields != queryFields )
            continue;

        JSObjBuilder b;
        JSObj q = query.extractFields(idxKey, b);

        /* regexp: only supported if form is /^text/ */
        JSObjBuilder b2;
        JSElemIter it(q);
        while( it.more() ) {
            Element e = it.next();
            if( e.eoo() )
                break;
            if( e.type() != RegEx ) {
                b2.append(e);
                continue;
            }
            if( *e.regexFlags() )
                return auto_ptr<Cursor>();
            const char *re = e.regex();
            if( !isIndexablePrefixRegex(re) )
                return auto_ptr<Cursor>();
            // we must be the last part of the key (for now until we are smarter)
            if( it.more() && !it.next().eoo() )
                return auto_ptr<Cursor>();
            // ok! use the text after '^' as the key value
            b2.append(e.fieldName(), re+1);
            break;
        }
        JSObj q2 = b2.done();
        return auto_ptr<Cursor>(
            new BtreeCursor(d->indexes[i].head, q2, 1, true));
    }

    return auto_ptr<Cursor>();
}
2007-10-30 05:50:14 -04:00
void deleteObjects(const char *ns, JSObj pattern, bool justOne) {
// cout << "delete ns:" << ns << " queryobjsize:" <<
// pattern.objsize() << endl;
2007-10-30 05:50:14 -04:00
2008-01-20 17:42:26 -05:00
if( strstr(ns, ".system.") ) {
2007-11-02 21:30:40 -04:00
cout << "ERROR: attempt to delete in system namespace " << ns << endl;
return;
}
2007-10-30 05:50:14 -04:00
JSMatcher matcher(pattern);
2007-11-11 14:21:02 -05:00
JSObj order;
auto_ptr<Cursor> c = getIndexCursor(ns, pattern, order);
if( c.get() == 0 )
c = theDataFileMgr.findAll(ns);
2007-11-01 22:34:44 -04:00
while( c->ok() ) {
Record *r = c->_current();
DiskLoc rloc = c->currLoc();
c->advance(); // must advance before deleting as the next ptr will die
2007-10-30 05:50:14 -04:00
JSObj js(r);
2007-11-24 16:15:09 -05:00
bool deep;
if( !matcher.matches(js, &deep) ) {
2007-11-11 14:21:02 -05:00
if( c->tempStopOnMiss() )
break;
}
2007-11-24 16:15:09 -05:00
else {
assert( !deep || !c->dup(rloc) ); // can't be a dup, we deleted it!
// cout << " found match to delete" << endl;
2007-11-11 14:21:02 -05:00
if( !justOne )
c->noteLocation();
2007-10-30 05:50:14 -04:00
theDataFileMgr.deleteRecord(ns, r, rloc);
if( justOne )
return;
2007-11-11 14:21:02 -05:00
c->checkLocation();
2007-10-30 05:50:14 -04:00
}
}
}
2007-12-24 20:59:58 -05:00
/* One numeric modification gathered from an update object's $inc section
   (filled in by getMods, consumed by applyMods and the upsert path). */
struct Mod {
    const char *fieldName;  // name of the field to adjust; pointer is not owned
    double n;               // amount to add to the field
};
/* Apply each Mod in `mods` to `obj`: look the field up by name and, when the
   element found is a Number, add the Mod's amount to it through number().
   Fields that are missing or not Numbers are left untouched. */
void applyMods(vector<Mod>& mods, JSObj obj) {
    for( vector<Mod>::size_type idx = 0; idx < mods.size(); ++idx ) {
        Mod& mod = mods[idx];
        Element target = obj.findElement(mod.fieldName);
        if( target.type() != Number )
            continue;
        target.number() += mod.n;
    }
}
/* get special operations like $inc
{ $inc: { a:1, b:1 } }
*/
/* Collect the numeric entries of every top-level "$inc" object in `from`,
   e.g. { $inc: { a:1, b:1 } }, and append one Mod per entry to `mods`.

   mods - output; entries are appended, existing content is kept.
   from - update object to scan.

   Entries inside $inc whose value is not a Number are skipped. Each
   Mod::fieldName is the pointer returned by Element::fieldName(); it is not
   copied, so it presumably stays valid only as long as the data behind `from`
   does -- confirm against callers.
*/
void getMods(vector<Mod>& mods, JSObj from) {
    JSElemIter it(from);
    while( it.more() ) {
        Element e = it.next();
        // stop at the end-of-object marker, as the other element loops in this file do
        if( e.eoo() )
            break;
        if( strcmp(e.fieldName(), "$inc") != 0 || e.type() != Object )
            continue;

        JSObj incSpec = e.embeddedObject();
        JSElemIter jt(incSpec);
        while( jt.more() ) {
            Element f = jt.next();
            if( f.eoo() )
                break;
            if( f.type() != Number )
                continue;
            Mod m;
            m.fieldName = f.fieldName();
            m.n = f.number();
            // temporary debug trace, kept as-is
            cout <<"TEMP: " << m.fieldName << ' ' << m.n << endl;
            mods.push_back(m);
        }
    }
}
2008-01-20 17:42:26 -05:00
/*
2007-12-24 20:59:58 -05:00
todo:
smart requery find record immediately
*/
2007-10-30 05:50:14 -04:00
void updateObjects(const char *ns, JSObj updateobj, JSObj pattern, bool upsert) {
2008-01-20 17:42:26 -05:00
//cout << "TEMP BAD";
//lrutest.find(updateobj);
2007-12-24 20:59:58 -05:00
// cout << "update ns:" << ns << " objsize:" << updateobj.objsize() << " queryobjsize:" <<
// pattern.objsize();
2007-10-30 05:50:14 -04:00
2008-01-20 17:42:26 -05:00
if( strstr(ns, ".system.") ) {
2007-11-13 16:44:01 -05:00
cout << "\nERROR: attempt to update in system namespace " << ns << endl;
2007-11-02 21:30:40 -04:00
return;
}
2007-11-11 18:28:33 -05:00
{
JSMatcher matcher(pattern);
JSObj order;
auto_ptr<Cursor> c = getIndexCursor(ns, pattern, order);
if( c.get() == 0 )
c = theDataFileMgr.findAll(ns);
while( c->ok() ) {
Record *r = c->_current();
JSObj js(r);
if( !matcher.matches(js) ) {
if( c->tempStopOnMiss() )
break;
}
else {
2007-11-24 16:15:09 -05:00
/* note: we only update one row and quit. if you do multiple later,
be careful or multikeys in arrays could break things badly. best
to only allow updating a single row with a multikey lookup.
*/
2007-12-24 20:59:58 -05:00
/* look for $inc etc. note as listed here, all fields to inc must be this type, you can't set some
regular ones at the moment. */
if( updateobj.firstElement().fieldName()[0] == '$' ) {
vector<Mod> mods;
getMods(mods, updateobj);
applyMods(mods, c->currLoc().obj());
return;
}
2007-11-11 18:28:33 -05:00
theDataFileMgr.update(ns, r, c->currLoc(), updateobj.objdata(), updateobj.objsize());
return;
}
c->advance();
2007-10-30 05:50:14 -04:00
}
}
2007-12-24 20:59:58 -05:00
if( upsert ) {
if( updateobj.firstElement().fieldName()[0] == '$' ) {
/* upsert of an $inc. build a default */
vector<Mod> mods;
getMods(mods, updateobj);
JSObjBuilder b;
b.appendElements(pattern);
for( vector<Mod>::iterator i = mods.begin(); i != mods.end(); i++ )
b.append(i->fieldName, i->n);
JSObj obj = b.done();
theDataFileMgr.insert(ns, (void*) obj.objdata(), obj.objsize());
return;
}
2007-10-30 05:50:14 -04:00
theDataFileMgr.insert(ns, (void*) updateobj.objdata(), updateobj.objsize());
2007-12-24 20:59:58 -05:00
}
2007-10-30 05:50:14 -04:00
}
2007-12-02 11:33:59 -05:00
// Verbosity of query tracing on stdout. runQuery prints the query and the
// "basiccursor" fallback at >= 1, the scan count at >= 2 and every candidate
// object at >= 50. Set by the queryTraceLevel and traceAll commands.
int queryTraceLevel = 0;
// Set by the traceAll command; not read in the portion of the file visible here.
int otherTraceLevel = 0;
// e.g.
// system.$cmd.find( { queryTraceLevel: 2 } );
2007-12-24 20:59:58 -05:00
//
// returns true if ran a cmd
//
inline bool runCommands(const char *ns, JSObj& jsobj, stringstream& ss, BufBuilder &b, JSObjBuilder& anObjBuilderForYa) {
2007-12-02 11:33:59 -05:00
if( strcmp(ns, "system.$cmd") != 0 )
2007-12-24 20:59:58 -05:00
return false;
2007-12-02 11:33:59 -05:00
ss << "\n $cmd: " << jsobj.toString();
2007-12-24 20:59:58 -05:00
bool ok = false;
bool valid = false;
2007-12-02 11:33:59 -05:00
Element e = jsobj.firstElement();
2007-12-24 20:59:58 -05:00
if( e.eoo() ) goto done;
2007-12-02 11:33:59 -05:00
if( e.type() == Number ) {
2007-12-24 20:59:58 -05:00
if( strcmp(e.fieldName(),"queryTraceLevel") == 0 ) {
valid = ok = true;
2007-12-02 11:33:59 -05:00
queryTraceLevel = (int) e.number();
2007-12-24 20:59:58 -05:00
} else if( strcmp(e.fieldName(),"traceAll") == 0 ) {
valid = ok = true;
2007-12-02 11:33:59 -05:00
queryTraceLevel = (int) e.number();
otherTraceLevel = (int) e.number();
}
}
else if( e.type() == String ) {
if( strcmp(e.fieldName(),"deleteIndexes") == 0 ) {
2007-12-24 20:59:58 -05:00
valid = true;
/* note: temp implementation. space not reclaimed! */
2008-01-20 17:42:26 -05:00
NamespaceDetails *d = nsdetails(e.valuestr());
cout << "CMD: deleteIndexes " << e.valuestr() << endl;
if( d ) {
2007-12-24 20:59:58 -05:00
ok = true;
cout << " d->nIndexes was " << d->nIndexes << endl;
2007-12-24 20:59:58 -05:00
anObjBuilderForYa.append("nIndexesWas", (double)d->nIndexes);
cout << " temp implementation, space not reclaimed" << endl;
d->nIndexes = 0;
}
2007-12-24 20:59:58 -05:00
else {
anObjBuilderForYa.append("errmsg", "ns not found");
}
}
}
2007-12-24 20:59:58 -05:00
done:
if( !valid )
anObjBuilderForYa.append("errmsg", "no such cmd");
anObjBuilderForYa.append("ok", ok?1.0:0.0);
JSObj x = anObjBuilderForYa.done();
b.append((void*) x.objdata(), x.objsize());
return true;
2007-12-02 11:33:59 -05:00
}
2007-12-01 11:44:42 -05:00
/* Run a query (or a command) against `ns` and build the reply message.

   ns        - namespace queried; "system.$cmd" requests go to runCommands.
   ntoreturn - batch limit: > 0 stops after that many documents (or once the
               buffer passes 16MB); 0 stops once the buffer passes 1MB.
   jsobj     - either { query: ..., orderby: ... } or, when both of those are
               empty, the match criteria itself.
   filter    - optional set of field names; when present only those fields are
               returned, and documents yielding none of them are skipped.
   ss        - log stream; a one-line summary is appended.

   When a batch fills up and more input remains, the cursor, matcher and filter
   are handed to a new ClientCursor and its id is returned in the reply so that
   getMore can continue. A cursor id of 0 in the reply means nothing was saved.

   Returns the reply header followed by the documents. The buffer is detached
   from the local BufBuilder via decouple() before returning; presumably the
   caller then owns it -- confirm.
*/
QueryResult* runQuery(const char *ns, int ntoreturn, JSObj jsobj,
                      auto_ptr< set<string> > filter, stringstream& ss) {
    ss << "query:" << ns << " ntoreturn:" << ntoreturn;
    if( jsobj.objsize() > 100 )
        ss << " querysz:" << jsobj.objsize();
    if( queryTraceLevel >= 1 )
        cout << "query: " << jsobj.toString() << endl;

    int n = 0;
    BufBuilder b(32768);
    JSObjBuilder cmdResBuf;
    long long cursorid = 0;

    // leave room for the header; it is filled in at the end
    b.skip(sizeof(QueryResult));

    if( runCommands(ns, jsobj, ss, b, cmdResBuf) ) {
        n = 1;
    }
    else {
        JSObj query = jsobj.getObjectField("query");
        JSObj order = jsobj.getObjectField("orderby");
        if( query.isEmpty() && order.isEmpty() )
            query = jsobj;

        auto_ptr<JSMatcher> matcher(new JSMatcher(query));
        auto_ptr<Cursor> c = getSpecialCursor(ns);
        if( c.get() == 0 ) {
            c = getIndexCursor(ns, query, order);
        }
        if( c.get() == 0 ) {
            c = theDataFileMgr.findAll(ns);
            if( queryTraceLevel >= 1 )
                cout << " basiccursor" << endl;
        }

        int nscanned = 0;
        while( c->ok() ) {
            JSObj js = c->current();
            if( queryTraceLevel >= 50 )
                cout << " checking against:\n " << js.toString() << endl;
            nscanned++;
            bool deep = false;
            if( !matcher->matches(js, &deep) ) {
                if( c->tempStopOnMiss() )
                    break;
            }
            else if( !deep || !c->dup(c->currLoc()) ) {
                bool ok = true;
                if( filter.get() ) {
                    JSObj x;
                    ok = x.addFields(js, *filter) > 0;
                    if( ok )
                        b.append((void*) x.objdata(), x.objsize());
                }
                else {
                    b.append((void*) js.objdata(), js.objsize());
                }
                if( ok ) {
                    n++;
                    if( (ntoreturn>0 && (n >= ntoreturn || b.len() > 16*1024*1024)) ||
                        (ntoreturn==0 && b.len()>1*1024*1024) ) {
                        // Step past the document just returned before saving the
                        // cursor: getMore starts from c->current(), so saving
                        // without advancing would send this document twice.
                        c->advance();
                        if( c->ok() ) {
                            // more...so save a cursor
                            ClientCursor *cc = new ClientCursor();
                            cc->c = c;  // auto_ptr: ownership moves, c is empty from here on
                            cursorid = allocCursorId();
                            cc->cursorid = cursorid;
                            cc->matcher = matcher;
                            cc->ns = ns;
                            cc->pos = n;
                            ClientCursor::add(cc);
                            cc->updateLocation();
                            cc->filter = filter;
                        }
                        // nothing left after advancing: leave cursorid at 0
                        break;
                    }
                }
            }
            c->advance();
        }

        if( queryTraceLevel >=2 )
            cout << " nscanned:" << nscanned << "\n ";
    }

    QueryResult *qr = (QueryResult *) b.buf();
    qr->_data[0] = 0;
    qr->_data[1] = 0;
    qr->_data[2] = 0;
    qr->_data[3] = 0;
    qr->len = b.len();
    ss << " resLen:" << b.len();
    // qr->channel = 0;
    qr->operation = opReply;
    qr->cursorId = cursorid;
    qr->startingFrom = 0;
    qr->nReturned = n;
    b.decouple();

    ss << " nReturned:" << n;
    return qr;
}
2007-11-04 16:17:44 -05:00
/* Continue a query whose cursor was saved by runQuery.

   ns        - namespace of the request (not used in this function).
   ntoreturn - batch limit: > 0 stops after that many documents (or once the
               buffer passes 16MB); 0 stops once the buffer passes 1MB.
   cursorid  - id of the saved ClientCursor, looked up in clientCursors.

   The reply's cursorId is the same id while more input remains, and 0 when the
   cursor is exhausted (it is then erased from clientCursors and deleted) or
   when the id is unknown. startingFrom is the cursor's position before this
   batch; nReturned is the number of documents in this batch.

   Returns the reply header followed by the documents. The buffer is detached
   from the local BufBuilder via decouple() before returning; presumably the
   caller then owns it -- confirm.
*/
QueryResult* getMore(const char *ns, int ntoreturn, long long cursorid) {
    BufBuilder b(32768);

    ClientCursor *cc = 0;
    CCMap::iterator it = clientCursors.find(cursorid);
    if( it == clientCursors.end() ) {
        cout << "Cursor not found in map. cursorid: " << cursorid << endl;
        // report "no cursor" rather than echoing an id we do not know
        cursorid = 0;
    }
    else {
        cc = it->second;
    }

    // leave room for the header; it is filled in at the end
    b.skip(sizeof(QueryResult));

    int start = 0;
    int n = 0;

    if( cc ) {
        start = cc->pos;
        Cursor *c = cc->c.get();
        bool exhausted = false;

        while( 1 ) {
            if( !c->ok() ) {
                exhausted = true;
                break;
            }
            JSObj js = c->current();
            bool deep = false;
            if( !cc->matcher->matches(js, &deep) ) {
                if( c->tempStopOnMiss() ) {
                    exhausted = true;
                    break;
                }
            }
            else if( !deep || !c->dup(c->currLoc()) ) {
                bool ok = true;
                if( cc->filter.get() ) {
                    JSObj x;
                    ok = x.addFields(js, *cc->filter) > 0;
                    if( ok )
                        b.append((void*) x.objdata(), x.objsize());
                }
                else {
                    b.append((void*) js.objdata(), js.objsize());
                }
                if( ok ) {
                    n++;
                    if( (ntoreturn>0 && (n >= ntoreturn || b.len() > 16*1024*1024)) ||
                        (ntoreturn==0 && b.len()>1*1024*1024) ) {
                        // Step past the document just returned; the next call
                        // starts from c->current() and would otherwise send it again.
                        c->advance();
                        if( c->ok() ) {
                            cc->pos += n;
                            cc->updateLocation();
                        }
                        else {
                            exhausted = true;
                        }
                        break;
                    }
                }
            }
            c->advance();
        }

        if( exhausted ) {
            // done! kill cursor.
            cursorid = 0;
            clientCursors.erase(it);
            delete cc;
            cc = 0;
        }
    }

    QueryResult *qr = (QueryResult *) b.buf();
    // clear these header bytes first, in the same order runQuery does, so they
    // are not sent uninitialised
    qr->_data[0] = 0;
    qr->_data[1] = 0;
    qr->_data[2] = 0;
    qr->_data[3] = 0;
    qr->cursorId = cursorid;
    qr->startingFrom = start;
    qr->len = b.len();
    // qr->reserved = 0;
    qr->operation = opReply;
    qr->nReturned = n;
    b.decouple();
    return qr;
}