blob: 971e20a2cf14fa64c3d1a1c81588872fd05ca6f0 [file] [log] [blame]
/*
** 2001 September 15
**
** The author disclaims copyright to this source code.  In place of
** a legal notice, here is a blessing:
**
**    May you do good and not evil.
**    May you find forgiveness for yourself and forgive others.
**    May you share freely, never taking more than you give.
**
*************************************************************************
** This module contains C code that generates VDBE code used to process
** the WHERE clause of SQL statements.  Also found here are subroutines
** to generate VDBE code to evaluate expressions.
**
** $Id: where.c,v 1.22 2001/10/08 13:22:33 drh Exp $
*/
18#include "sqliteInt.h"
19
20/*
21** The query generator uses an array of instances of this structure to
22** help it analyze the subexpressions of the WHERE clause. Each WHERE
23** clause subexpression is separated from the others by an AND operator.
24*/
25typedef struct ExprInfo ExprInfo;
26struct ExprInfo {
27 Expr *p; /* Pointer to the subexpression */
28 int indexable; /* True if this subexprssion is usable by an index */
drh967e8b72000-06-21 13:59:10 +000029 int idxLeft; /* p->pLeft is a column in this table number. -1 if
30 ** p->pLeft is not the column of any table */
31 int idxRight; /* p->pRight is a column in this table number. -1 if
32 ** p->pRight is not the column of any table */
drh75897232000-05-29 14:26:00 +000033 unsigned prereqLeft; /* Tables referenced by p->pLeft */
34 unsigned prereqRight; /* Tables referenced by p->pRight */
35};
36
/*
** Determine the number of elements in an array.
**
** X must be a true array (not a pointer).  The argument is parenthesized
** so that any array-valued expression may be passed safely.  The result is
** cast to int so that comparisons against (signed) int loop counters are
** carried out as signed comparisons rather than being silently converted
** to unsigned arithmetic.
*/
#define ARRAYSIZE(X)  ((int)(sizeof(X)/sizeof((X)[0])))
41
42/*
43** This routine is used to divide the WHERE expression into subexpressions
44** separated by the AND operator.
45**
46** aSlot[] is an array of subexpressions structures.
47** There are nSlot spaces left in this array. This routine attempts to
48** split pExpr into subexpressions and fills aSlot[] with those subexpressions.
49** The return value is the number of slots filled.
50*/
51static int exprSplit(int nSlot, ExprInfo *aSlot, Expr *pExpr){
52 int cnt = 0;
53 if( pExpr==0 || nSlot<1 ) return 0;
54 if( nSlot==1 || pExpr->op!=TK_AND ){
55 aSlot[0].p = pExpr;
56 return 1;
57 }
58 if( pExpr->pLeft->op!=TK_AND ){
59 aSlot[0].p = pExpr->pLeft;
60 cnt = 1 + exprSplit(nSlot-1, &aSlot[1], pExpr->pRight);
61 }else{
62 cnt = exprSplit(nSlot, aSlot, pExpr->pRight);
63 cnt += exprSplit(nSlot-cnt, &aSlot[cnt], pExpr->pLeft);
64 }
65 return cnt;
66}
67
68/*
69** This routine walks (recursively) an expression tree and generates
70** a bitmask indicating which tables are used in that expression
71** tree. Bit 0 of the mask is set if table 0 is used. But 1 is set
72** if table 1 is used. And so forth.
73**
74** In order for this routine to work, the calling function must have
75** previously invoked sqliteExprResolveIds() on the expression. See
76** the header comment on that routine for additional information.
drh19a775c2000-06-05 18:54:46 +000077**
78** "base" is the cursor number (the value of the iTable field) that
79** corresponds to the first entry in the table list. This is the
80** same as pParse->nTab.
drh75897232000-05-29 14:26:00 +000081*/
drh19a775c2000-06-05 18:54:46 +000082static int exprTableUsage(int base, Expr *p){
drh75897232000-05-29 14:26:00 +000083 unsigned int mask = 0;
84 if( p==0 ) return 0;
drh967e8b72000-06-21 13:59:10 +000085 if( p->op==TK_COLUMN ){
drh19a775c2000-06-05 18:54:46 +000086 return 1<< (p->iTable - base);
drh75897232000-05-29 14:26:00 +000087 }
88 if( p->pRight ){
drh19a775c2000-06-05 18:54:46 +000089 mask = exprTableUsage(base, p->pRight);
drh75897232000-05-29 14:26:00 +000090 }
91 if( p->pLeft ){
drh19a775c2000-06-05 18:54:46 +000092 mask |= exprTableUsage(base, p->pLeft);
drh75897232000-05-29 14:26:00 +000093 }
94 return mask;
95}
96
97/*
98** The input to this routine is an ExprInfo structure with only the
99** "p" field filled in. The job of this routine is to analyze the
100** subexpression and populate all the other fields of the ExprInfo
101** structure.
drh19a775c2000-06-05 18:54:46 +0000102**
103** "base" is the cursor number (the value of the iTable field) that
104** corresponds to the first entyr in the table list. This is the
105** same as pParse->nTab.
drh75897232000-05-29 14:26:00 +0000106*/
drh19a775c2000-06-05 18:54:46 +0000107static void exprAnalyze(int base, ExprInfo *pInfo){
drh75897232000-05-29 14:26:00 +0000108 Expr *pExpr = pInfo->p;
drh19a775c2000-06-05 18:54:46 +0000109 pInfo->prereqLeft = exprTableUsage(base, pExpr->pLeft);
110 pInfo->prereqRight = exprTableUsage(base, pExpr->pRight);
drh75897232000-05-29 14:26:00 +0000111 pInfo->indexable = 0;
112 pInfo->idxLeft = -1;
113 pInfo->idxRight = -1;
114 if( pExpr->op==TK_EQ && (pInfo->prereqRight & pInfo->prereqLeft)==0 ){
drh967e8b72000-06-21 13:59:10 +0000115 if( pExpr->pRight->op==TK_COLUMN ){
drh19a775c2000-06-05 18:54:46 +0000116 pInfo->idxRight = pExpr->pRight->iTable - base;
drh75897232000-05-29 14:26:00 +0000117 pInfo->indexable = 1;
118 }
drh967e8b72000-06-21 13:59:10 +0000119 if( pExpr->pLeft->op==TK_COLUMN ){
drh19a775c2000-06-05 18:54:46 +0000120 pInfo->idxLeft = pExpr->pLeft->iTable - base;
drh75897232000-05-29 14:26:00 +0000121 pInfo->indexable = 1;
122 }
123 }
124}
125
126/*
127** Generating the beginning of the loop used for WHERE clause processing.
128** The return value is a pointer to an (opaque) structure that contains
129** information needed to terminate the loop. Later, the calling routine
130** should invoke sqliteWhereEnd() with the return value of this function
131** in order to complete the WHERE clause processing.
132**
133** If an error occurs, this routine returns NULL.
134*/
135WhereInfo *sqliteWhereBegin(
136 Parse *pParse, /* The parser context */
137 IdList *pTabList, /* A list of all tables */
138 Expr *pWhere, /* The WHERE clause */
139 int pushKey /* If TRUE, leave the table key on the stack */
140){
141 int i; /* Loop counter */
142 WhereInfo *pWInfo; /* Will become the return value of this function */
143 Vdbe *v = pParse->pVdbe; /* The virtual database engine */
144 int brk, cont; /* Addresses used during code generation */
145 int *aOrder; /* Order in which pTabList entries are searched */
146 int nExpr; /* Number of subexpressions in the WHERE clause */
147 int loopMask; /* One bit set for each outer loop */
148 int haveKey; /* True if KEY is on the stack */
drh19a775c2000-06-05 18:54:46 +0000149 int base; /* First available index for OP_Open opcodes */
drh75897232000-05-29 14:26:00 +0000150 Index *aIdx[32]; /* Index to use on each nested loop. */
drhc4a3c772001-04-04 11:48:57 +0000151 int aDirect[32]; /* If TRUE, then index this table using ROWID */
drh75897232000-05-29 14:26:00 +0000152 ExprInfo aExpr[50]; /* The WHERE clause is divided into these expressions */
153
154 /* Allocate space for aOrder[]. */
155 aOrder = sqliteMalloc( sizeof(int) * pTabList->nId );
156
157 /* Allocate and initialize the WhereInfo structure that will become the
158 ** return value.
159 */
160 pWInfo = sqliteMalloc( sizeof(WhereInfo) );
drhdaffd0e2001-04-11 14:28:42 +0000161 if( sqlite_malloc_failed ){
drh75897232000-05-29 14:26:00 +0000162 sqliteFree(aOrder);
drhdaffd0e2001-04-11 14:28:42 +0000163 sqliteFree(pWInfo);
drh75897232000-05-29 14:26:00 +0000164 return 0;
165 }
166 pWInfo->pParse = pParse;
167 pWInfo->pTabList = pTabList;
drh19a775c2000-06-05 18:54:46 +0000168 base = pWInfo->base = pParse->nTab;
drh75897232000-05-29 14:26:00 +0000169
170 /* Split the WHERE clause into as many as 32 separate subexpressions
171 ** where each subexpression is separated by an AND operator. Any additional
172 ** subexpressions are attached in the aExpr[32] and will not enter
173 ** into the query optimizer computations. 32 is chosen as the cutoff
174 ** since that is the number of bits in an integer that we use for an
175 ** expression-used mask.
176 */
177 memset(aExpr, 0, sizeof(aExpr));
178 nExpr = exprSplit(ARRAYSIZE(aExpr), aExpr, pWhere);
179
180 /* Analyze all of the subexpressions.
181 */
182 for(i=0; i<nExpr; i++){
drh19a775c2000-06-05 18:54:46 +0000183 exprAnalyze(pParse->nTab, &aExpr[i]);
drh75897232000-05-29 14:26:00 +0000184 }
185
186 /* Figure out a good nesting order for the tables. aOrder[0] will
187 ** be the index in pTabList of the outermost table. aOrder[1] will
188 ** be the first nested loop and so on. aOrder[pTabList->nId-1] will
189 ** be the innermost loop.
190 **
drh7e391e12000-05-30 20:17:49 +0000191 ** Someday will put in a good algorithm here to reorder the loops
drh75897232000-05-29 14:26:00 +0000192 ** for an effiecient query. But for now, just use whatever order the
193 ** tables appear in in the pTabList.
194 */
195 for(i=0; i<pTabList->nId; i++){
196 aOrder[i] = i;
197 }
198
199 /* Figure out what index to use (if any) for each nested loop.
200 ** Make aIdx[i] point to the index to use for the i-th nested loop
201 ** where i==0 is the outer loop and i==pTabList->nId-1 is the inner
drhc4a3c772001-04-04 11:48:57 +0000202 ** loop. If the expression uses only the ROWID field, then set
203 ** aDirect[i] to 1.
drh75897232000-05-29 14:26:00 +0000204 **
205 ** Actually, if there are more than 32 tables in the join, only the
206 ** first 32 tables are candidates for indices.
207 */
208 loopMask = 0;
209 for(i=0; i<pTabList->nId && i<ARRAYSIZE(aIdx); i++){
drhc4a3c772001-04-04 11:48:57 +0000210 int j;
drh75897232000-05-29 14:26:00 +0000211 int idx = aOrder[i];
212 Table *pTab = pTabList->a[idx].pTab;
213 Index *pIdx;
214 Index *pBestIdx = 0;
215
drhc4a3c772001-04-04 11:48:57 +0000216 /* Check to see if there is an expression that uses only the
217 ** ROWID field of this table. If so, set aDirect[i] to 1.
218 ** If not, set aDirect[i] to 0.
219 */
220 aDirect[i] = 0;
221 for(j=0; j<nExpr; j++){
222 if( aExpr[j].idxLeft==idx && aExpr[j].p->pLeft->iColumn<0
223 && (aExpr[j].prereqRight & loopMask)==aExpr[j].prereqRight ){
224 aDirect[i] = 1;
225 break;
226 }
227 if( aExpr[j].idxRight==idx && aExpr[j].p->pRight->iColumn<0
228 && (aExpr[j].prereqLeft & loopMask)==aExpr[j].prereqLeft ){
229 aDirect[i] = 1;
230 break;
231 }
232 }
233 if( aDirect[i] ){
234 loopMask |= 1<<idx;
235 aIdx[i] = 0;
236 continue;
237 }
238
drh75897232000-05-29 14:26:00 +0000239 /* Do a search for usable indices. Leave pBestIdx pointing to
drh7e391e12000-05-30 20:17:49 +0000240 ** the most specific usable index.
drh75897232000-05-29 14:26:00 +0000241 **
242 ** "Most specific" means that pBestIdx is the usable index that
drh967e8b72000-06-21 13:59:10 +0000243 ** has the largest value for nColumn. A usable index is one for
244 ** which there are subexpressions to compute every column of the
drh75897232000-05-29 14:26:00 +0000245 ** index.
246 */
247 for(pIdx=pTab->pIndex; pIdx; pIdx=pIdx->pNext){
drh967e8b72000-06-21 13:59:10 +0000248 int columnMask = 0;
drh75897232000-05-29 14:26:00 +0000249
drh967e8b72000-06-21 13:59:10 +0000250 if( pIdx->nColumn>32 ) continue;
drh75897232000-05-29 14:26:00 +0000251 for(j=0; j<nExpr; j++){
252 if( aExpr[j].idxLeft==idx
253 && (aExpr[j].prereqRight & loopMask)==aExpr[j].prereqRight ){
drh967e8b72000-06-21 13:59:10 +0000254 int iColumn = aExpr[j].p->pLeft->iColumn;
drh75897232000-05-29 14:26:00 +0000255 int k;
drh967e8b72000-06-21 13:59:10 +0000256 for(k=0; k<pIdx->nColumn; k++){
257 if( pIdx->aiColumn[k]==iColumn ){
258 columnMask |= 1<<k;
drh75897232000-05-29 14:26:00 +0000259 break;
260 }
261 }
262 }
263 if( aExpr[j].idxRight==idx
264 && (aExpr[j].prereqLeft & loopMask)==aExpr[j].prereqLeft ){
drh967e8b72000-06-21 13:59:10 +0000265 int iColumn = aExpr[j].p->pRight->iColumn;
drh75897232000-05-29 14:26:00 +0000266 int k;
drh967e8b72000-06-21 13:59:10 +0000267 for(k=0; k<pIdx->nColumn; k++){
268 if( pIdx->aiColumn[k]==iColumn ){
269 columnMask |= 1<<k;
drh75897232000-05-29 14:26:00 +0000270 break;
271 }
272 }
273 }
274 }
drh967e8b72000-06-21 13:59:10 +0000275 if( columnMask + 1 == (1<<pIdx->nColumn) ){
276 if( pBestIdx==0 || pBestIdx->nColumn<pIdx->nColumn ){
drh75897232000-05-29 14:26:00 +0000277 pBestIdx = pIdx;
278 }
279 }
280 }
281 aIdx[i] = pBestIdx;
drh7e391e12000-05-30 20:17:49 +0000282 loopMask |= 1<<idx;
drh75897232000-05-29 14:26:00 +0000283 }
284
285 /* Open all tables in the pTabList and all indices in aIdx[].
286 */
287 for(i=0; i<pTabList->nId; i++){
drhf57b3392001-10-08 13:22:32 +0000288 int openOp;
289 Table *pTab;
290
291 pTab = pTabList->a[i].pTab;
292 openOp = pTab->isTemp ? OP_OpenAux : OP_Open;
293 sqliteVdbeAddOp(v, openOp, base+i, pTab->tnum, pTab->zName, 0);
drh50e5dad2001-09-15 00:57:28 +0000294 if( i==0 && !pParse->schemaVerified &&
295 (pParse->db->flags & SQLITE_InTrans)==0 ){
296 sqliteVdbeAddOp(v, OP_VerifyCookie, pParse->db->schema_cookie, 0, 0, 0);
297 pParse->schemaVerified = 1;
298 }
drh75897232000-05-29 14:26:00 +0000299 if( i<ARRAYSIZE(aIdx) && aIdx[i]!=0 ){
drhf57b3392001-10-08 13:22:32 +0000300 sqliteVdbeAddOp(v, openOp, base+pTabList->nId+i, aIdx[i]->tnum,
drh5e00f6c2001-09-13 13:46:56 +0000301 aIdx[i]->zName, 0);
drh75897232000-05-29 14:26:00 +0000302 }
303 }
drh19a775c2000-06-05 18:54:46 +0000304 memcpy(pWInfo->aIdx, aIdx, sizeof(aIdx));
drh75897232000-05-29 14:26:00 +0000305
306 /* Generate the code to do the search
307 */
308 pWInfo->iBreak = brk = sqliteVdbeMakeLabel(v);
309 loopMask = 0;
310 for(i=0; i<pTabList->nId; i++){
311 int j, k;
312 int idx = aOrder[i];
drhc4a3c772001-04-04 11:48:57 +0000313 int goDirect;
314 Index *pIdx;
drh75897232000-05-29 14:26:00 +0000315
drhc4a3c772001-04-04 11:48:57 +0000316 if( i<ARRAYSIZE(aIdx) ){
317 pIdx = aIdx[i];
318 goDirect = aDirect[i];
319 }else{
320 pIdx = 0;
321 goDirect = 0;
322 }
323
324 if( goDirect ){
325 /* Case 1: We can directly reference a single row using the ROWID field.
326 */
327 cont = brk;
328 for(k=0; k<nExpr; k++){
329 if( aExpr[k].p==0 ) continue;
330 if( aExpr[k].idxLeft==idx
331 && (aExpr[k].prereqRight & loopMask)==aExpr[k].prereqRight
332 && aExpr[k].p->pLeft->iColumn<0
333 ){
334 sqliteExprCode(pParse, aExpr[k].p->pRight);
335 aExpr[k].p = 0;
336 break;
337 }
338 if( aExpr[k].idxRight==idx
339 && (aExpr[k].prereqLeft & loopMask)==aExpr[k].prereqLeft
340 && aExpr[k].p->pRight->iColumn<0
341 ){
342 sqliteExprCode(pParse, aExpr[k].p->pLeft);
343 aExpr[k].p = 0;
344 break;
345 }
346 }
347 sqliteVdbeAddOp(v, OP_AddImm, 0, 0, 0, 0);
348 if( i==pTabList->nId-1 && pushKey ){
349 haveKey = 1;
350 }else{
drh1eaa2692001-09-18 02:02:23 +0000351 sqliteVdbeAddOp(v, OP_NotFound, base+idx, brk, 0, 0);
drhc4a3c772001-04-04 11:48:57 +0000352 haveKey = 0;
353 }
354 }else if( pIdx==0 ){
355 /* Case 2: There was no usable index. We must do a complete
drh75897232000-05-29 14:26:00 +0000356 ** scan of the table.
357 */
drhd78eeee2001-09-13 16:18:53 +0000358 sqliteVdbeAddOp(v, OP_Rewind, base+idx, 0, 0, 0);
drhc4a3c772001-04-04 11:48:57 +0000359 cont = sqliteVdbeMakeLabel(v);
drh19a775c2000-06-05 18:54:46 +0000360 sqliteVdbeAddOp(v, OP_Next, base+idx, brk, 0, cont);
drh75897232000-05-29 14:26:00 +0000361 haveKey = 0;
362 }else{
drhc4a3c772001-04-04 11:48:57 +0000363 /* Case 3: We do have a usable index in pIdx.
drh75897232000-05-29 14:26:00 +0000364 */
drhc4a3c772001-04-04 11:48:57 +0000365 cont = sqliteVdbeMakeLabel(v);
drh967e8b72000-06-21 13:59:10 +0000366 for(j=0; j<pIdx->nColumn; j++){
drh75897232000-05-29 14:26:00 +0000367 for(k=0; k<nExpr; k++){
368 if( aExpr[k].p==0 ) continue;
369 if( aExpr[k].idxLeft==idx
370 && (aExpr[k].prereqRight & loopMask)==aExpr[k].prereqRight
drh967e8b72000-06-21 13:59:10 +0000371 && aExpr[k].p->pLeft->iColumn==pIdx->aiColumn[j]
drh75897232000-05-29 14:26:00 +0000372 ){
373 sqliteExprCode(pParse, aExpr[k].p->pRight);
374 aExpr[k].p = 0;
375 break;
376 }
377 if( aExpr[k].idxRight==idx
378 && (aExpr[k].prereqLeft & loopMask)==aExpr[k].prereqLeft
drh967e8b72000-06-21 13:59:10 +0000379 && aExpr[k].p->pRight->iColumn==pIdx->aiColumn[j]
drh75897232000-05-29 14:26:00 +0000380 ){
381 sqliteExprCode(pParse, aExpr[k].p->pLeft);
382 aExpr[k].p = 0;
383 break;
384 }
385 }
386 }
drh967e8b72000-06-21 13:59:10 +0000387 sqliteVdbeAddOp(v, OP_MakeKey, pIdx->nColumn, 0, 0, 0);
drhc87fa692001-08-19 18:19:46 +0000388 sqliteVdbeAddOp(v, OP_BeginIdx, base+pTabList->nId+i, 0, 0, 0);
drh19a775c2000-06-05 18:54:46 +0000389 sqliteVdbeAddOp(v, OP_NextIdx, base+pTabList->nId+i, brk, 0, cont);
drh75897232000-05-29 14:26:00 +0000390 if( i==pTabList->nId-1 && pushKey ){
391 haveKey = 1;
392 }else{
drhbe0072d2001-09-13 14:46:09 +0000393 sqliteVdbeAddOp(v, OP_MoveTo, base+idx, 0, 0, 0);
drh75897232000-05-29 14:26:00 +0000394 haveKey = 0;
395 }
396 }
397 loopMask |= 1<<idx;
398
399 /* Insert code to test every subexpression that can be completely
400 ** computed using the current set of tables.
401 */
402 for(j=0; j<nExpr; j++){
403 if( aExpr[j].p==0 ) continue;
404 if( (aExpr[j].prereqRight & loopMask)!=aExpr[j].prereqRight ) continue;
405 if( (aExpr[j].prereqLeft & loopMask)!=aExpr[j].prereqLeft ) continue;
406 if( haveKey ){
drh573bd272001-02-19 23:23:38 +0000407 haveKey = 0;
drhbe0072d2001-09-13 14:46:09 +0000408 sqliteVdbeAddOp(v, OP_MoveTo, base+idx, 0, 0, 0);
drh75897232000-05-29 14:26:00 +0000409 }
410 sqliteExprIfFalse(pParse, aExpr[j].p, cont);
411 aExpr[j].p = 0;
412 }
413 brk = cont;
414 }
415 pWInfo->iContinue = cont;
416 if( pushKey && !haveKey ){
drhbe0072d2001-09-13 14:46:09 +0000417 sqliteVdbeAddOp(v, OP_Recno, base, 0, 0, 0);
drh75897232000-05-29 14:26:00 +0000418 }
419 sqliteFree(aOrder);
420 return pWInfo;
421}
422
423/*
424** Generate the end of the WHERE loop.
425*/
426void sqliteWhereEnd(WhereInfo *pWInfo){
427 Vdbe *v = pWInfo->pParse->pVdbe;
drh19a775c2000-06-05 18:54:46 +0000428 int i;
429 int brk = pWInfo->iBreak;
430 int base = pWInfo->base;
431
drh75897232000-05-29 14:26:00 +0000432 sqliteVdbeAddOp(v, OP_Goto, 0, pWInfo->iContinue, 0, 0);
drh19a775c2000-06-05 18:54:46 +0000433 for(i=0; i<pWInfo->pTabList->nId; i++){
434 sqliteVdbeAddOp(v, OP_Close, base+i, 0, 0, brk);
435 brk = 0;
436 if( i<ARRAYSIZE(pWInfo->aIdx) && pWInfo->aIdx[i]!=0 ){
437 sqliteVdbeAddOp(v, OP_Close, base+pWInfo->pTabList->nId+i, 0, 0, 0);
438 }
439 }
440 if( brk!=0 ){
441 sqliteVdbeAddOp(v, OP_Noop, 0, 0, 0, brk);
442 }
drh75897232000-05-29 14:26:00 +0000443 sqliteFree(pWInfo);
444 return;
445}