blob: 2a84a5952a2135050365ed99b907ecb86c4162c3 [file] [log] [blame]
/*
** 2001 September 15
**
** The author disclaims copyright to this source code.  In place of
** a legal notice, here is a blessing:
**
**    May you do good and not evil.
**    May you find forgiveness for yourself and forgive others.
**    May you share freely, never taking more than you give.
**
*************************************************************************
** This module contains C code that generates VDBE code used to process
** the WHERE clause of SQL statements.  This module is responsible for
** generating the code that loops through a table looking for applicable
** rows.  Indices are selected and used to speed the search when doing
** so is applicable.  Because this module is responsible for selecting
** indices, you might also think of this module as the "query optimizer".
*/
19#include "sqliteInt.h"
drhe54df422013-11-12 18:37:25 +000020#include "whereInt.h"
drh51147ba2005-07-23 22:59:55 +000021
drh6f82e852015-06-06 20:12:09 +000022/* Forward declaration of methods */
23static int whereLoopResize(sqlite3*, WhereLoop*, int);
24
25/* Test variable that can be set to enable WHERE tracing */
26#if defined(SQLITE_TEST) || defined(SQLITE_DEBUG)
27/***/ int sqlite3WhereTrace = 0;
28#endif
29
30
drh51147ba2005-07-23 22:59:55 +000031/*
drh6f328482013-06-05 23:39:34 +000032** Return the estimated number of output rows from a WHERE clause
33*/
drhc63367e2013-06-10 20:46:50 +000034u64 sqlite3WhereOutputRowCount(WhereInfo *pWInfo){
drhbf539c42013-10-05 18:16:02 +000035 return sqlite3LogEstToInt(pWInfo->nRowOut);
drh6f328482013-06-05 23:39:34 +000036}
37
38/*
39** Return one of the WHERE_DISTINCT_xxxxx values to indicate how this
40** WHERE clause returns outputs for DISTINCT processing.
41*/
42int sqlite3WhereIsDistinct(WhereInfo *pWInfo){
43 return pWInfo->eDistinct;
44}
45
46/*
47** Return TRUE if the WHERE clause returns rows in ORDER BY order.
48** Return FALSE if the output needs to be sorted.
49*/
50int sqlite3WhereIsOrdered(WhereInfo *pWInfo){
drhddba0c22014-03-18 20:33:42 +000051 return pWInfo->nOBSat;
drh6f328482013-06-05 23:39:34 +000052}
53
54/*
55** Return the VDBE address or label to jump to in order to continue
56** immediately with the next row of a WHERE clause.
57*/
58int sqlite3WhereContinueLabel(WhereInfo *pWInfo){
drha22a75e2014-03-21 18:16:23 +000059 assert( pWInfo->iContinue!=0 );
drh6f328482013-06-05 23:39:34 +000060 return pWInfo->iContinue;
61}
62
63/*
64** Return the VDBE address or label to jump to in order to break
65** out of a WHERE loop.
66*/
67int sqlite3WhereBreakLabel(WhereInfo *pWInfo){
68 return pWInfo->iBreak;
69}
70
71/*
72** Return TRUE if an UPDATE or DELETE statement can operate directly on
73** the rowids returned by a WHERE clause. Return FALSE if doing an
74** UPDATE or DELETE might change subsequent WHERE clause results.
drhfc8d4f92013-11-08 15:19:46 +000075**
76** If the ONEPASS optimization is used (if this routine returns true)
77** then also write the indices of open cursors used by ONEPASS
78** into aiCur[0] and aiCur[1]. iaCur[0] gets the cursor of the data
79** table and iaCur[1] gets the cursor used by an auxiliary index.
80** Either value may be -1, indicating that cursor is not used.
81** Any cursors returned will have been opened for writing.
82**
83** aiCur[0] and aiCur[1] both get -1 if the where-clause logic is
84** unable to use the ONEPASS optimization.
drh6f328482013-06-05 23:39:34 +000085*/
drhfc8d4f92013-11-08 15:19:46 +000086int sqlite3WhereOkOnePass(WhereInfo *pWInfo, int *aiCur){
87 memcpy(aiCur, pWInfo->aiCurOnePass, sizeof(int)*2);
drh6f328482013-06-05 23:39:34 +000088 return pWInfo->okOnePass;
89}
90
91/*
drhaa32e3c2013-07-16 21:31:23 +000092** Move the content of pSrc into pDest
93*/
94static void whereOrMove(WhereOrSet *pDest, WhereOrSet *pSrc){
95 pDest->n = pSrc->n;
96 memcpy(pDest->a, pSrc->a, pDest->n*sizeof(pDest->a[0]));
97}
98
99/*
100** Try to insert a new prerequisite/cost entry into the WhereOrSet pSet.
101**
102** The new entry might overwrite an existing entry, or it might be
103** appended, or it might be discarded. Do whatever is the right thing
104** so that pSet keeps the N_OR_COST best entries seen so far.
105*/
106static int whereOrInsert(
107 WhereOrSet *pSet, /* The WhereOrSet to be updated */
108 Bitmask prereq, /* Prerequisites of the new entry */
drhbf539c42013-10-05 18:16:02 +0000109 LogEst rRun, /* Run-cost of the new entry */
110 LogEst nOut /* Number of outputs for the new entry */
drhaa32e3c2013-07-16 21:31:23 +0000111){
112 u16 i;
113 WhereOrCost *p;
114 for(i=pSet->n, p=pSet->a; i>0; i--, p++){
115 if( rRun<=p->rRun && (prereq & p->prereq)==prereq ){
116 goto whereOrInsert_done;
117 }
118 if( p->rRun<=rRun && (p->prereq & prereq)==p->prereq ){
119 return 0;
120 }
121 }
122 if( pSet->n<N_OR_COST ){
123 p = &pSet->a[pSet->n++];
124 p->nOut = nOut;
125 }else{
126 p = pSet->a;
127 for(i=1; i<pSet->n; i++){
128 if( p->rRun>pSet->a[i].rRun ) p = pSet->a + i;
129 }
130 if( p->rRun<=rRun ) return 0;
131 }
132whereOrInsert_done:
133 p->prereq = prereq;
134 p->rRun = rRun;
135 if( p->nOut>nOut ) p->nOut = nOut;
136 return 1;
137}
138
139/*
drh1398ad32005-01-19 23:24:50 +0000140** Return the bitmask for the given cursor number. Return 0 if
141** iCursor is not in the set.
drh6a3ea0e2003-05-02 14:32:12 +0000142*/
drh6f82e852015-06-06 20:12:09 +0000143Bitmask sqlite3WhereGetMask(WhereMaskSet *pMaskSet, int iCursor){
drh6a3ea0e2003-05-02 14:32:12 +0000144 int i;
drhfcd71b62011-04-05 22:08:24 +0000145 assert( pMaskSet->n<=(int)sizeof(Bitmask)*8 );
drh6a3ea0e2003-05-02 14:32:12 +0000146 for(i=0; i<pMaskSet->n; i++){
drh51669862004-12-18 18:40:26 +0000147 if( pMaskSet->ix[i]==iCursor ){
drh7699d1c2013-06-04 12:42:29 +0000148 return MASKBIT(i);
drh51669862004-12-18 18:40:26 +0000149 }
drh6a3ea0e2003-05-02 14:32:12 +0000150 }
drh6a3ea0e2003-05-02 14:32:12 +0000151 return 0;
152}
153
154/*
drh1398ad32005-01-19 23:24:50 +0000155** Create a new mask for cursor iCursor.
drh0fcef5e2005-07-19 17:38:22 +0000156**
157** There is one cursor per table in the FROM clause. The number of
158** tables in the FROM clause is limited by a test early in the
drhb6fb62d2005-09-20 08:47:20 +0000159** sqlite3WhereBegin() routine. So we know that the pMaskSet->ix[]
drh0fcef5e2005-07-19 17:38:22 +0000160** array will never overflow.
drh1398ad32005-01-19 23:24:50 +0000161*/
drh111a6a72008-12-21 03:51:16 +0000162static void createMask(WhereMaskSet *pMaskSet, int iCursor){
drhcad651e2007-04-20 12:22:01 +0000163 assert( pMaskSet->n < ArraySize(pMaskSet->ix) );
drh0fcef5e2005-07-19 17:38:22 +0000164 pMaskSet->ix[pMaskSet->n++] = iCursor;
drh1398ad32005-01-19 23:24:50 +0000165}
166
167/*
drh1c8148f2013-05-04 20:25:23 +0000168** Advance to the next WhereTerm that matches according to the criteria
169** established when the pScan object was initialized by whereScanInit().
170** Return NULL if there are no more matching WhereTerms.
171*/
danb2cfc142013-07-05 11:10:54 +0000172static WhereTerm *whereScanNext(WhereScan *pScan){
drh1c8148f2013-05-04 20:25:23 +0000173 int iCur; /* The cursor on the LHS of the term */
174 int iColumn; /* The column on the LHS of the term. -1 for IPK */
175 Expr *pX; /* An expression being tested */
176 WhereClause *pWC; /* Shorthand for pScan->pWC */
177 WhereTerm *pTerm; /* The term being tested */
drh43b85ef2013-06-10 12:34:45 +0000178 int k = pScan->k; /* Where to start scanning */
drh1c8148f2013-05-04 20:25:23 +0000179
180 while( pScan->iEquiv<=pScan->nEquiv ){
181 iCur = pScan->aEquiv[pScan->iEquiv-2];
182 iColumn = pScan->aEquiv[pScan->iEquiv-1];
183 while( (pWC = pScan->pWC)!=0 ){
drh43b85ef2013-06-10 12:34:45 +0000184 for(pTerm=pWC->a+k; k<pWC->nTerm; k++, pTerm++){
drhe1a086e2013-10-28 20:15:56 +0000185 if( pTerm->leftCursor==iCur
186 && pTerm->u.leftColumn==iColumn
187 && (pScan->iEquiv<=2 || !ExprHasProperty(pTerm->pExpr, EP_FromJoin))
188 ){
drh1c8148f2013-05-04 20:25:23 +0000189 if( (pTerm->eOperator & WO_EQUIV)!=0
190 && pScan->nEquiv<ArraySize(pScan->aEquiv)
191 ){
192 int j;
193 pX = sqlite3ExprSkipCollate(pTerm->pExpr->pRight);
194 assert( pX->op==TK_COLUMN );
195 for(j=0; j<pScan->nEquiv; j+=2){
196 if( pScan->aEquiv[j]==pX->iTable
197 && pScan->aEquiv[j+1]==pX->iColumn ){
198 break;
199 }
200 }
201 if( j==pScan->nEquiv ){
202 pScan->aEquiv[j] = pX->iTable;
203 pScan->aEquiv[j+1] = pX->iColumn;
204 pScan->nEquiv += 2;
205 }
206 }
207 if( (pTerm->eOperator & pScan->opMask)!=0 ){
208 /* Verify the affinity and collating sequence match */
209 if( pScan->zCollName && (pTerm->eOperator & WO_ISNULL)==0 ){
210 CollSeq *pColl;
drh70d18342013-06-06 19:16:33 +0000211 Parse *pParse = pWC->pWInfo->pParse;
drh1c8148f2013-05-04 20:25:23 +0000212 pX = pTerm->pExpr;
213 if( !sqlite3IndexAffinityOk(pX, pScan->idxaff) ){
214 continue;
215 }
216 assert(pX->pLeft);
drh70d18342013-06-06 19:16:33 +0000217 pColl = sqlite3BinaryCompareCollSeq(pParse,
drh1c8148f2013-05-04 20:25:23 +0000218 pX->pLeft, pX->pRight);
drh70d18342013-06-06 19:16:33 +0000219 if( pColl==0 ) pColl = pParse->db->pDfltColl;
drh1c8148f2013-05-04 20:25:23 +0000220 if( sqlite3StrICmp(pColl->zName, pScan->zCollName) ){
221 continue;
222 }
223 }
drhe8d0c612015-05-14 01:05:25 +0000224 if( (pTerm->eOperator & (WO_EQ|WO_IS))!=0
drha184fb82013-05-08 04:22:59 +0000225 && (pX = pTerm->pExpr->pRight)->op==TK_COLUMN
226 && pX->iTable==pScan->aEquiv[0]
227 && pX->iColumn==pScan->aEquiv[1]
228 ){
drhe8d0c612015-05-14 01:05:25 +0000229 testcase( pTerm->eOperator & WO_IS );
drha184fb82013-05-08 04:22:59 +0000230 continue;
231 }
drh43b85ef2013-06-10 12:34:45 +0000232 pScan->k = k+1;
drh1c8148f2013-05-04 20:25:23 +0000233 return pTerm;
234 }
235 }
236 }
drhad01d892013-06-19 13:59:49 +0000237 pScan->pWC = pScan->pWC->pOuter;
drh43b85ef2013-06-10 12:34:45 +0000238 k = 0;
drh1c8148f2013-05-04 20:25:23 +0000239 }
240 pScan->pWC = pScan->pOrigWC;
drh43b85ef2013-06-10 12:34:45 +0000241 k = 0;
drh1c8148f2013-05-04 20:25:23 +0000242 pScan->iEquiv += 2;
243 }
drh1c8148f2013-05-04 20:25:23 +0000244 return 0;
245}
246
247/*
248** Initialize a WHERE clause scanner object. Return a pointer to the
249** first match. Return NULL if there are no matches.
250**
251** The scanner will be searching the WHERE clause pWC. It will look
252** for terms of the form "X <op> <expr>" where X is column iColumn of table
253** iCur. The <op> must be one of the operators described by opMask.
254**
drh3b48e8c2013-06-12 20:18:16 +0000255** If the search is for X and the WHERE clause contains terms of the
256** form X=Y then this routine might also return terms of the form
257** "Y <op> <expr>". The number of levels of transitivity is limited,
258** but is enough to handle most commonly occurring SQL statements.
259**
drh1c8148f2013-05-04 20:25:23 +0000260** If X is not the INTEGER PRIMARY KEY then X must be compatible with
261** index pIdx.
262*/
danb2cfc142013-07-05 11:10:54 +0000263static WhereTerm *whereScanInit(
drh1c8148f2013-05-04 20:25:23 +0000264 WhereScan *pScan, /* The WhereScan object being initialized */
265 WhereClause *pWC, /* The WHERE clause to be scanned */
266 int iCur, /* Cursor to scan for */
267 int iColumn, /* Column to scan for */
268 u32 opMask, /* Operator(s) to scan for */
269 Index *pIdx /* Must be compatible with this index */
270){
271 int j;
272
drhe9d935a2013-06-05 16:19:59 +0000273 /* memset(pScan, 0, sizeof(*pScan)); */
drh1c8148f2013-05-04 20:25:23 +0000274 pScan->pOrigWC = pWC;
275 pScan->pWC = pWC;
276 if( pIdx && iColumn>=0 ){
277 pScan->idxaff = pIdx->pTable->aCol[iColumn].affinity;
278 for(j=0; pIdx->aiColumn[j]!=iColumn; j++){
dan39129ce2014-06-30 15:23:57 +0000279 if( NEVER(j>pIdx->nColumn) ) return 0;
drh1c8148f2013-05-04 20:25:23 +0000280 }
281 pScan->zCollName = pIdx->azColl[j];
drhe9d935a2013-06-05 16:19:59 +0000282 }else{
283 pScan->idxaff = 0;
284 pScan->zCollName = 0;
drh1c8148f2013-05-04 20:25:23 +0000285 }
286 pScan->opMask = opMask;
drhe9d935a2013-06-05 16:19:59 +0000287 pScan->k = 0;
drh1c8148f2013-05-04 20:25:23 +0000288 pScan->aEquiv[0] = iCur;
289 pScan->aEquiv[1] = iColumn;
290 pScan->nEquiv = 2;
291 pScan->iEquiv = 2;
292 return whereScanNext(pScan);
293}
294
295/*
drhfe05af82005-07-21 03:14:59 +0000296** Search for a term in the WHERE clause that is of the form "X <op> <expr>"
297** where X is a reference to the iColumn of table iCur and <op> is one of
298** the WO_xx operator codes specified by the op parameter.
299** Return a pointer to the term. Return 0 if not found.
drh58eb1c02013-01-17 00:08:42 +0000300**
301** The term returned might by Y=<expr> if there is another constraint in
302** the WHERE clause that specifies that X=Y. Any such constraints will be
303** identified by the WO_EQUIV bit in the pTerm->eOperator field. The
304** aEquiv[] array holds X and all its equivalents, with each SQL variable
305** taking up two slots in aEquiv[]. The first slot is for the cursor number
306** and the second is for the column number. There are 22 slots in aEquiv[]
307** so that means we can look for X plus up to 10 other equivalent values.
308** Hence a search for X will return <expr> if X=A1 and A1=A2 and A2=A3
309** and ... and A9=A10 and A10=<expr>.
310**
311** If there are multiple terms in the WHERE clause of the form "X <op> <expr>"
312** then try for the one with no dependencies on <expr> - in other words where
313** <expr> is a constant expression of some kind. Only return entries of
314** the form "X <op> Y" where Y is a column in another table if no terms of
drh459f63e2013-03-06 01:55:27 +0000315** the form "X <op> <const-expr>" exist. If no terms with a constant RHS
316** exist, try to return a term that does not use WO_EQUIV.
drhfe05af82005-07-21 03:14:59 +0000317*/
drh6f82e852015-06-06 20:12:09 +0000318WhereTerm *sqlite3WhereFindTerm(
drhfe05af82005-07-21 03:14:59 +0000319 WhereClause *pWC, /* The WHERE clause to be searched */
320 int iCur, /* Cursor number of LHS */
321 int iColumn, /* Column number of LHS */
322 Bitmask notReady, /* RHS must not overlap with this mask */
drhec1724e2008-12-09 01:32:03 +0000323 u32 op, /* Mask of WO_xx values describing operator */
drhfe05af82005-07-21 03:14:59 +0000324 Index *pIdx /* Must be compatible with this index, if not NULL */
325){
drh1c8148f2013-05-04 20:25:23 +0000326 WhereTerm *pResult = 0;
327 WhereTerm *p;
328 WhereScan scan;
drh7a5bcc02013-01-16 17:08:58 +0000329
drh1c8148f2013-05-04 20:25:23 +0000330 p = whereScanInit(&scan, pWC, iCur, iColumn, op, pIdx);
drhe8d0c612015-05-14 01:05:25 +0000331 op &= WO_EQ|WO_IS;
drh1c8148f2013-05-04 20:25:23 +0000332 while( p ){
333 if( (p->prereqRight & notReady)==0 ){
drhe8d0c612015-05-14 01:05:25 +0000334 if( p->prereqRight==0 && (p->eOperator&op)!=0 ){
335 testcase( p->eOperator & WO_IS );
drh1c8148f2013-05-04 20:25:23 +0000336 return p;
drhfe05af82005-07-21 03:14:59 +0000337 }
drh1c8148f2013-05-04 20:25:23 +0000338 if( pResult==0 ) pResult = p;
drhfe05af82005-07-21 03:14:59 +0000339 }
drh1c8148f2013-05-04 20:25:23 +0000340 p = whereScanNext(&scan);
drhfe05af82005-07-21 03:14:59 +0000341 }
drh7a5bcc02013-01-16 17:08:58 +0000342 return pResult;
drhfe05af82005-07-21 03:14:59 +0000343}
344
drh7b4fc6a2007-02-06 13:26:32 +0000345/*
peter.d.reid60ec9142014-09-06 16:39:46 +0000346** This function searches pList for an entry that matches the iCol-th column
drh3b48e8c2013-06-12 20:18:16 +0000347** of index pIdx.
dan6f343962011-07-01 18:26:40 +0000348**
349** If such an expression is found, its index in pList->a[] is returned. If
350** no expression is found, -1 is returned.
351*/
352static int findIndexCol(
353 Parse *pParse, /* Parse context */
354 ExprList *pList, /* Expression list to search */
355 int iBase, /* Cursor for table associated with pIdx */
356 Index *pIdx, /* Index to match column of */
357 int iCol /* Column of index to match */
358){
359 int i;
360 const char *zColl = pIdx->azColl[iCol];
361
362 for(i=0; i<pList->nExpr; i++){
drh580c8c12012-12-08 03:34:04 +0000363 Expr *p = sqlite3ExprSkipCollate(pList->a[i].pExpr);
drhf1d3e322011-07-09 13:00:41 +0000364 if( p->op==TK_COLUMN
365 && p->iColumn==pIdx->aiColumn[iCol]
366 && p->iTable==iBase
367 ){
drh580c8c12012-12-08 03:34:04 +0000368 CollSeq *pColl = sqlite3ExprCollSeq(pParse, pList->a[i].pExpr);
drh65df68e2015-04-15 05:31:02 +0000369 if( pColl && 0==sqlite3StrICmp(pColl->zName, zColl) ){
dan6f343962011-07-01 18:26:40 +0000370 return i;
371 }
372 }
373 }
374
375 return -1;
376}
377
378/*
dan6f343962011-07-01 18:26:40 +0000379** Return true if the DISTINCT expression-list passed as the third argument
drh4f402f22013-06-11 18:59:38 +0000380** is redundant.
381**
drhb121dd12015-06-06 18:30:17 +0000382** A DISTINCT list is redundant if any subset of the columns in the
383** DISTINCT list are collectively unique and individually non-null.
dan6f343962011-07-01 18:26:40 +0000384*/
385static int isDistinctRedundant(
drh4f402f22013-06-11 18:59:38 +0000386 Parse *pParse, /* Parsing context */
387 SrcList *pTabList, /* The FROM clause */
388 WhereClause *pWC, /* The WHERE clause */
389 ExprList *pDistinct /* The result set that needs to be DISTINCT */
dan6f343962011-07-01 18:26:40 +0000390){
391 Table *pTab;
392 Index *pIdx;
393 int i;
394 int iBase;
395
396 /* If there is more than one table or sub-select in the FROM clause of
397 ** this query, then it will not be possible to show that the DISTINCT
398 ** clause is redundant. */
399 if( pTabList->nSrc!=1 ) return 0;
400 iBase = pTabList->a[0].iCursor;
401 pTab = pTabList->a[0].pTab;
402
dan94e08d92011-07-02 06:44:05 +0000403 /* If any of the expressions is an IPK column on table iBase, then return
404 ** true. Note: The (p->iTable==iBase) part of this test may be false if the
405 ** current SELECT is a correlated sub-query.
406 */
dan6f343962011-07-01 18:26:40 +0000407 for(i=0; i<pDistinct->nExpr; i++){
drh580c8c12012-12-08 03:34:04 +0000408 Expr *p = sqlite3ExprSkipCollate(pDistinct->a[i].pExpr);
dan94e08d92011-07-02 06:44:05 +0000409 if( p->op==TK_COLUMN && p->iTable==iBase && p->iColumn<0 ) return 1;
dan6f343962011-07-01 18:26:40 +0000410 }
411
412 /* Loop through all indices on the table, checking each to see if it makes
413 ** the DISTINCT qualifier redundant. It does so if:
414 **
415 ** 1. The index is itself UNIQUE, and
416 **
417 ** 2. All of the columns in the index are either part of the pDistinct
418 ** list, or else the WHERE clause contains a term of the form "col=X",
419 ** where X is a constant value. The collation sequences of the
420 ** comparison and select-list expressions must match those of the index.
dan6a36f432012-04-20 16:59:24 +0000421 **
422 ** 3. All of those index columns for which the WHERE clause does not
423 ** contain a "col=X" term are subject to a NOT NULL constraint.
dan6f343962011-07-01 18:26:40 +0000424 */
425 for(pIdx=pTab->pIndex; pIdx; pIdx=pIdx->pNext){
drh5f1d1d92014-07-31 22:59:04 +0000426 if( !IsUniqueIndex(pIdx) ) continue;
drhbbbdc832013-10-22 18:01:40 +0000427 for(i=0; i<pIdx->nKeyCol; i++){
428 i16 iCol = pIdx->aiColumn[i];
drh6f82e852015-06-06 20:12:09 +0000429 if( 0==sqlite3WhereFindTerm(pWC, iBase, iCol, ~(Bitmask)0, WO_EQ, pIdx) ){
dan6a36f432012-04-20 16:59:24 +0000430 int iIdxCol = findIndexCol(pParse, pDistinct, iBase, pIdx, i);
drhbbbdc832013-10-22 18:01:40 +0000431 if( iIdxCol<0 || pTab->aCol[iCol].notNull==0 ){
dan6a36f432012-04-20 16:59:24 +0000432 break;
433 }
dan6f343962011-07-01 18:26:40 +0000434 }
435 }
drhbbbdc832013-10-22 18:01:40 +0000436 if( i==pIdx->nKeyCol ){
dan6f343962011-07-01 18:26:40 +0000437 /* This index implies that the DISTINCT qualifier is redundant. */
438 return 1;
439 }
440 }
441
442 return 0;
443}
drh0fcef5e2005-07-19 17:38:22 +0000444
drh8636e9c2013-06-11 01:50:08 +0000445
drh75897232000-05-29 14:26:00 +0000446/*
drh3b48e8c2013-06-12 20:18:16 +0000447** Estimate the logarithm of the input value to base 2.
drh28c4cf42005-07-27 20:41:43 +0000448*/
drhbf539c42013-10-05 18:16:02 +0000449static LogEst estLog(LogEst N){
drh696964d2014-06-12 15:46:46 +0000450 return N<=10 ? 0 : sqlite3LogEst(N) - 33;
drh28c4cf42005-07-27 20:41:43 +0000451}
452
drh6d209d82006-06-27 01:54:26 +0000453/*
drh7b3aa082015-05-29 13:55:33 +0000454** Convert OP_Column opcodes to OP_Copy in previously generated code.
455**
456** This routine runs over generated VDBE code and translates OP_Column
457** opcodes into OP_Copy, and OP_Rowid into OP_Null, when the table is being
458** accessed via co-routine instead of via table lookup.
459*/
460static void translateColumnToCopy(
461 Vdbe *v, /* The VDBE containing code to translate */
462 int iStart, /* Translate from this opcode to the end */
463 int iTabCur, /* OP_Column/OP_Rowid references to this table */
464 int iRegister /* The first column is in this register */
465){
466 VdbeOp *pOp = sqlite3VdbeGetOp(v, iStart);
467 int iEnd = sqlite3VdbeCurrentAddr(v);
468 for(; iStart<iEnd; iStart++, pOp++){
469 if( pOp->p1!=iTabCur ) continue;
470 if( pOp->opcode==OP_Column ){
471 pOp->opcode = OP_Copy;
472 pOp->p1 = pOp->p2 + iRegister;
473 pOp->p2 = pOp->p3;
474 pOp->p3 = 0;
475 }else if( pOp->opcode==OP_Rowid ){
476 pOp->opcode = OP_Null;
477 pOp->p1 = 0;
478 pOp->p3 = 0;
479 }
480 }
481}
482
/*
** Two routines for printing the content of an sqlite3_index_info
** structure.  Used for testing and debugging only.  The routines are
** compiled only when virtual tables are not omitted and WHERETRACE_ENABLED
** is defined; otherwise they are replaced by macros that expand to
** nothing.  Even when compiled in, they print nothing unless
** sqlite3WhereTrace is non-zero.
*/
#if !defined(SQLITE_OMIT_VIRTUALTABLE) && defined(WHERETRACE_ENABLED)
/* Print the constraint and ORDER BY inputs of p */
static void TRACE_IDX_INPUTS(sqlite3_index_info *p){
  int i;
  if( sqlite3WhereTrace==0 ) return;
  i = 0;
  while( i<p->nConstraint ){
    sqlite3DebugPrintf(" constraint[%d]: col=%d termid=%d op=%d usabled=%d\n",
       i,
       p->aConstraint[i].iColumn,
       p->aConstraint[i].iTermOffset,
       p->aConstraint[i].op,
       p->aConstraint[i].usable);
    i++;
  }
  i = 0;
  while( i<p->nOrderBy ){
    sqlite3DebugPrintf(" orderby[%d]: col=%d desc=%d\n",
       i,
       p->aOrderBy[i].iColumn,
       p->aOrderBy[i].desc);
    i++;
  }
}
/* Print the per-constraint usage and the scalar output fields of p */
static void TRACE_IDX_OUTPUTS(sqlite3_index_info *p){
  int i;
  if( sqlite3WhereTrace==0 ) return;
  i = 0;
  while( i<p->nConstraint ){
    sqlite3DebugPrintf(" usage[%d]: argvIdx=%d omit=%d\n",
       i,
       p->aConstraintUsage[i].argvIndex,
       p->aConstraintUsage[i].omit);
    i++;
  }
  sqlite3DebugPrintf(" idxNum=%d\n", p->idxNum);
  sqlite3DebugPrintf(" idxStr=%s\n", p->idxStr);
  sqlite3DebugPrintf(" orderByConsumed=%d\n", p->orderByConsumed);
  sqlite3DebugPrintf(" estimatedCost=%g\n", p->estimatedCost);
  sqlite3DebugPrintf(" estimatedRows=%lld\n", p->estimatedRows);
}
#else
#define TRACE_IDX_INPUTS(A)
#define TRACE_IDX_OUTPUTS(A)
#endif
527
drhc6339082010-04-07 16:54:58 +0000528#ifndef SQLITE_OMIT_AUTOMATIC_INDEX
drh8b307fb2010-04-06 15:57:05 +0000529/*
drh4139c992010-04-07 14:59:45 +0000530** Return TRUE if the WHERE clause term pTerm is of a form where it
531** could be used with an index to access pSrc, assuming an appropriate
532** index existed.
533*/
534static int termCanDriveIndex(
535 WhereTerm *pTerm, /* WHERE clause term to check */
536 struct SrcList_item *pSrc, /* Table we are trying to access */
537 Bitmask notReady /* Tables in outer loops of the join */
538){
539 char aff;
540 if( pTerm->leftCursor!=pSrc->iCursor ) return 0;
drhe8d0c612015-05-14 01:05:25 +0000541 if( (pTerm->eOperator & (WO_EQ|WO_IS))==0 ) return 0;
drh4139c992010-04-07 14:59:45 +0000542 if( (pTerm->prereqRight & notReady)!=0 ) return 0;
drh23f98da2013-05-21 15:52:07 +0000543 if( pTerm->u.leftColumn<0 ) return 0;
drh4139c992010-04-07 14:59:45 +0000544 aff = pSrc->pTab->aCol[pTerm->u.leftColumn].affinity;
545 if( !sqlite3IndexAffinityOk(pTerm->pExpr, aff) ) return 0;
drhe0cc3c22015-05-13 17:54:08 +0000546 testcase( pTerm->pExpr->op==TK_IS );
drh4139c992010-04-07 14:59:45 +0000547 return 1;
548}
drhc6339082010-04-07 16:54:58 +0000549#endif
drh4139c992010-04-07 14:59:45 +0000550
drhc6339082010-04-07 16:54:58 +0000551
552#ifndef SQLITE_OMIT_AUTOMATIC_INDEX
drh8b307fb2010-04-06 15:57:05 +0000553/*
drhc6339082010-04-07 16:54:58 +0000554** Generate code to construct the Index object for an automatic index
555** and to set up the WhereLevel object pLevel so that the code generator
556** makes use of the automatic index.
drh8b307fb2010-04-06 15:57:05 +0000557*/
drhc6339082010-04-07 16:54:58 +0000558static void constructAutomaticIndex(
drh8b307fb2010-04-06 15:57:05 +0000559 Parse *pParse, /* The parsing context */
560 WhereClause *pWC, /* The WHERE clause */
561 struct SrcList_item *pSrc, /* The FROM clause term to get the next index */
562 Bitmask notReady, /* Mask of cursors that are not available */
563 WhereLevel *pLevel /* Write new index here */
564){
drhbbbdc832013-10-22 18:01:40 +0000565 int nKeyCol; /* Number of columns in the constructed index */
drh8b307fb2010-04-06 15:57:05 +0000566 WhereTerm *pTerm; /* A single term of the WHERE clause */
567 WhereTerm *pWCEnd; /* End of pWC->a[] */
drh8b307fb2010-04-06 15:57:05 +0000568 Index *pIdx; /* Object describing the transient index */
569 Vdbe *v; /* Prepared statement under construction */
drh8b307fb2010-04-06 15:57:05 +0000570 int addrInit; /* Address of the initialization bypass jump */
571 Table *pTable; /* The table being indexed */
drh8b307fb2010-04-06 15:57:05 +0000572 int addrTop; /* Top of the index fill loop */
573 int regRecord; /* Register holding an index record */
574 int n; /* Column counter */
drh4139c992010-04-07 14:59:45 +0000575 int i; /* Loop counter */
576 int mxBitCol; /* Maximum column in pSrc->colUsed */
drh424aab82010-04-06 18:28:20 +0000577 CollSeq *pColl; /* Collating sequence to on a column */
drh7ba39a92013-05-30 17:43:19 +0000578 WhereLoop *pLoop; /* The Loop object */
drh77e57df2013-10-22 14:28:02 +0000579 char *zNotUsed; /* Extra space on the end of pIdx */
drh4139c992010-04-07 14:59:45 +0000580 Bitmask idxCols; /* Bitmap of columns used for indexing */
581 Bitmask extraCols; /* Bitmap of additional columns */
drh8d56e202013-06-28 23:55:45 +0000582 u8 sentWarning = 0; /* True if a warnning has been issued */
drh059b2d52014-10-24 19:28:09 +0000583 Expr *pPartial = 0; /* Partial Index Expression */
584 int iContinue = 0; /* Jump here to skip excluded rows */
drh7b3aa082015-05-29 13:55:33 +0000585 struct SrcList_item *pTabItem; /* FROM clause term being indexed */
drh8b307fb2010-04-06 15:57:05 +0000586
587 /* Generate code to skip over the creation and initialization of the
588 ** transient index on 2nd and subsequent iterations of the loop. */
589 v = pParse->pVdbe;
590 assert( v!=0 );
drh7d176102014-02-18 03:07:12 +0000591 addrInit = sqlite3CodeOnce(pParse); VdbeCoverage(v);
drh8b307fb2010-04-06 15:57:05 +0000592
drh4139c992010-04-07 14:59:45 +0000593 /* Count the number of columns that will be added to the index
594 ** and used to match WHERE clause constraints */
drhbbbdc832013-10-22 18:01:40 +0000595 nKeyCol = 0;
drh424aab82010-04-06 18:28:20 +0000596 pTable = pSrc->pTab;
drh8b307fb2010-04-06 15:57:05 +0000597 pWCEnd = &pWC->a[pWC->nTerm];
drh7ba39a92013-05-30 17:43:19 +0000598 pLoop = pLevel->pWLoop;
drh4139c992010-04-07 14:59:45 +0000599 idxCols = 0;
drh81186b42013-06-18 01:52:41 +0000600 for(pTerm=pWC->a; pTerm<pWCEnd; pTerm++){
drh13cc90c2015-02-25 00:24:41 +0000601 Expr *pExpr = pTerm->pExpr;
602 assert( !ExprHasProperty(pExpr, EP_FromJoin) /* prereq always non-zero */
603 || pExpr->iRightJoinTable!=pSrc->iCursor /* for the right-hand */
604 || pLoop->prereq!=0 ); /* table of a LEFT JOIN */
drh059b2d52014-10-24 19:28:09 +0000605 if( pLoop->prereq==0
drh051575c2014-10-25 12:28:25 +0000606 && (pTerm->wtFlags & TERM_VIRTUAL)==0
drh13cc90c2015-02-25 00:24:41 +0000607 && !ExprHasProperty(pExpr, EP_FromJoin)
608 && sqlite3ExprIsTableConstant(pExpr, pSrc->iCursor) ){
drh059b2d52014-10-24 19:28:09 +0000609 pPartial = sqlite3ExprAnd(pParse->db, pPartial,
drh13cc90c2015-02-25 00:24:41 +0000610 sqlite3ExprDup(pParse->db, pExpr, 0));
drh059b2d52014-10-24 19:28:09 +0000611 }
drh4139c992010-04-07 14:59:45 +0000612 if( termCanDriveIndex(pTerm, pSrc, notReady) ){
613 int iCol = pTerm->u.leftColumn;
drh7699d1c2013-06-04 12:42:29 +0000614 Bitmask cMask = iCol>=BMS ? MASKBIT(BMS-1) : MASKBIT(iCol);
drh52ff8ea2010-04-08 14:15:56 +0000615 testcase( iCol==BMS );
616 testcase( iCol==BMS-1 );
drh8d56e202013-06-28 23:55:45 +0000617 if( !sentWarning ){
618 sqlite3_log(SQLITE_WARNING_AUTOINDEX,
619 "automatic index on %s(%s)", pTable->zName,
620 pTable->aCol[iCol].zName);
621 sentWarning = 1;
622 }
drh0013e722010-04-08 00:40:15 +0000623 if( (idxCols & cMask)==0 ){
drh059b2d52014-10-24 19:28:09 +0000624 if( whereLoopResize(pParse->db, pLoop, nKeyCol+1) ){
625 goto end_auto_index_create;
626 }
drhbbbdc832013-10-22 18:01:40 +0000627 pLoop->aLTerm[nKeyCol++] = pTerm;
drh0013e722010-04-08 00:40:15 +0000628 idxCols |= cMask;
629 }
drh8b307fb2010-04-06 15:57:05 +0000630 }
631 }
drhbbbdc832013-10-22 18:01:40 +0000632 assert( nKeyCol>0 );
633 pLoop->u.btree.nEq = pLoop->nLTerm = nKeyCol;
drh53b52f72013-05-31 11:57:39 +0000634 pLoop->wsFlags = WHERE_COLUMN_EQ | WHERE_IDX_ONLY | WHERE_INDEXED
drh986b3872013-06-28 21:12:20 +0000635 | WHERE_AUTO_INDEX;
drh4139c992010-04-07 14:59:45 +0000636
637 /* Count the number of additional columns needed to create a
638 ** covering index. A "covering index" is an index that contains all
639 ** columns that are needed by the query. With a covering index, the
640 ** original table never needs to be accessed. Automatic indices must
641 ** be a covering index because the index will not be updated if the
642 ** original table changes and the index and table cannot both be used
643 ** if they go out of sync.
644 */
drh7699d1c2013-06-04 12:42:29 +0000645 extraCols = pSrc->colUsed & (~idxCols | MASKBIT(BMS-1));
drhc3ef4fa2014-10-28 15:58:50 +0000646 mxBitCol = MIN(BMS-1,pTable->nCol);
drh52ff8ea2010-04-08 14:15:56 +0000647 testcase( pTable->nCol==BMS-1 );
648 testcase( pTable->nCol==BMS-2 );
drh4139c992010-04-07 14:59:45 +0000649 for(i=0; i<mxBitCol; i++){
drhbbbdc832013-10-22 18:01:40 +0000650 if( extraCols & MASKBIT(i) ) nKeyCol++;
drh4139c992010-04-07 14:59:45 +0000651 }
drh7699d1c2013-06-04 12:42:29 +0000652 if( pSrc->colUsed & MASKBIT(BMS-1) ){
drhbbbdc832013-10-22 18:01:40 +0000653 nKeyCol += pTable->nCol - BMS + 1;
drh4139c992010-04-07 14:59:45 +0000654 }
drh8b307fb2010-04-06 15:57:05 +0000655
656 /* Construct the Index object to describe this index */
drhbbbdc832013-10-22 18:01:40 +0000657 pIdx = sqlite3AllocateIndexObject(pParse->db, nKeyCol+1, 0, &zNotUsed);
drh059b2d52014-10-24 19:28:09 +0000658 if( pIdx==0 ) goto end_auto_index_create;
drh7ba39a92013-05-30 17:43:19 +0000659 pLoop->u.btree.pIndex = pIdx;
drh8b307fb2010-04-06 15:57:05 +0000660 pIdx->zName = "auto-index";
drh424aab82010-04-06 18:28:20 +0000661 pIdx->pTable = pTable;
drh8b307fb2010-04-06 15:57:05 +0000662 n = 0;
drh0013e722010-04-08 00:40:15 +0000663 idxCols = 0;
drh8b307fb2010-04-06 15:57:05 +0000664 for(pTerm=pWC->a; pTerm<pWCEnd; pTerm++){
drh4139c992010-04-07 14:59:45 +0000665 if( termCanDriveIndex(pTerm, pSrc, notReady) ){
drh0013e722010-04-08 00:40:15 +0000666 int iCol = pTerm->u.leftColumn;
drh7699d1c2013-06-04 12:42:29 +0000667 Bitmask cMask = iCol>=BMS ? MASKBIT(BMS-1) : MASKBIT(iCol);
drh7963b0e2013-06-17 21:37:40 +0000668 testcase( iCol==BMS-1 );
669 testcase( iCol==BMS );
drh0013e722010-04-08 00:40:15 +0000670 if( (idxCols & cMask)==0 ){
671 Expr *pX = pTerm->pExpr;
672 idxCols |= cMask;
673 pIdx->aiColumn[n] = pTerm->u.leftColumn;
674 pColl = sqlite3BinaryCompareCollSeq(pParse, pX->pLeft, pX->pRight);
drh29031832015-04-15 07:34:25 +0000675 pIdx->azColl[n] = pColl ? pColl->zName : "BINARY";
drh0013e722010-04-08 00:40:15 +0000676 n++;
677 }
drh8b307fb2010-04-06 15:57:05 +0000678 }
679 }
drh7ba39a92013-05-30 17:43:19 +0000680 assert( (u32)n==pLoop->u.btree.nEq );
drh4139c992010-04-07 14:59:45 +0000681
drhc6339082010-04-07 16:54:58 +0000682 /* Add additional columns needed to make the automatic index into
683 ** a covering index */
drh4139c992010-04-07 14:59:45 +0000684 for(i=0; i<mxBitCol; i++){
drh7699d1c2013-06-04 12:42:29 +0000685 if( extraCols & MASKBIT(i) ){
drh4139c992010-04-07 14:59:45 +0000686 pIdx->aiColumn[n] = i;
687 pIdx->azColl[n] = "BINARY";
688 n++;
689 }
690 }
drh7699d1c2013-06-04 12:42:29 +0000691 if( pSrc->colUsed & MASKBIT(BMS-1) ){
drh4139c992010-04-07 14:59:45 +0000692 for(i=BMS-1; i<pTable->nCol; i++){
693 pIdx->aiColumn[n] = i;
694 pIdx->azColl[n] = "BINARY";
695 n++;
696 }
697 }
drhbbbdc832013-10-22 18:01:40 +0000698 assert( n==nKeyCol );
drh44156282013-10-23 22:23:03 +0000699 pIdx->aiColumn[n] = -1;
700 pIdx->azColl[n] = "BINARY";
drh8b307fb2010-04-06 15:57:05 +0000701
drhc6339082010-04-07 16:54:58 +0000702 /* Create the automatic index */
drh8b307fb2010-04-06 15:57:05 +0000703 assert( pLevel->iIdxCur>=0 );
drha1f41242013-05-31 20:00:58 +0000704 pLevel->iIdxCur = pParse->nTab++;
drh2ec2fb22013-11-06 19:59:23 +0000705 sqlite3VdbeAddOp2(v, OP_OpenAutoindex, pLevel->iIdxCur, nKeyCol+1);
706 sqlite3VdbeSetP4KeyInfo(pParse, pIdx);
drha21a64d2010-04-06 22:33:55 +0000707 VdbeComment((v, "for %s", pTable->zName));
drh8b307fb2010-04-06 15:57:05 +0000708
drhc6339082010-04-07 16:54:58 +0000709 /* Fill the automatic index with content */
drh059b2d52014-10-24 19:28:09 +0000710 sqlite3ExprCachePush(pParse);
drh7b3aa082015-05-29 13:55:33 +0000711 pTabItem = &pWC->pWInfo->pTabList->a[pLevel->iFrom];
drh8a48b9c2015-08-19 15:20:00 +0000712 if( pTabItem->fg.viaCoroutine ){
drh7b3aa082015-05-29 13:55:33 +0000713 int regYield = pTabItem->regReturn;
714 sqlite3VdbeAddOp3(v, OP_InitCoroutine, regYield, 0, pTabItem->addrFillSub);
715 addrTop = sqlite3VdbeAddOp1(v, OP_Yield, regYield);
716 VdbeCoverage(v);
717 VdbeComment((v, "next row of \"%s\"", pTabItem->pTab->zName));
718 }else{
719 addrTop = sqlite3VdbeAddOp1(v, OP_Rewind, pLevel->iTabCur); VdbeCoverage(v);
720 }
drh059b2d52014-10-24 19:28:09 +0000721 if( pPartial ){
722 iContinue = sqlite3VdbeMakeLabel(v);
723 sqlite3ExprIfFalse(pParse, pPartial, iContinue, SQLITE_JUMPIFNULL);
drh051575c2014-10-25 12:28:25 +0000724 pLoop->wsFlags |= WHERE_PARTIALIDX;
drh059b2d52014-10-24 19:28:09 +0000725 }
drh8b307fb2010-04-06 15:57:05 +0000726 regRecord = sqlite3GetTempReg(pParse);
drh1c2c0b72014-01-04 19:27:05 +0000727 sqlite3GenerateIndexKey(pParse, pIdx, pLevel->iTabCur, regRecord, 0, 0, 0, 0);
drh8b307fb2010-04-06 15:57:05 +0000728 sqlite3VdbeAddOp2(v, OP_IdxInsert, pLevel->iIdxCur, regRecord);
729 sqlite3VdbeChangeP5(v, OPFLAG_USESEEKRESULT);
drh059b2d52014-10-24 19:28:09 +0000730 if( pPartial ) sqlite3VdbeResolveLabel(v, iContinue);
drh8a48b9c2015-08-19 15:20:00 +0000731 if( pTabItem->fg.viaCoroutine ){
drh7b3aa082015-05-29 13:55:33 +0000732 translateColumnToCopy(v, addrTop, pLevel->iTabCur, pTabItem->regResult);
733 sqlite3VdbeAddOp2(v, OP_Goto, 0, addrTop);
drh8a48b9c2015-08-19 15:20:00 +0000734 pTabItem->fg.viaCoroutine = 0;
drh7b3aa082015-05-29 13:55:33 +0000735 }else{
736 sqlite3VdbeAddOp2(v, OP_Next, pLevel->iTabCur, addrTop+1); VdbeCoverage(v);
737 }
drha21a64d2010-04-06 22:33:55 +0000738 sqlite3VdbeChangeP5(v, SQLITE_STMTSTATUS_AUTOINDEX);
drh8b307fb2010-04-06 15:57:05 +0000739 sqlite3VdbeJumpHere(v, addrTop);
740 sqlite3ReleaseTempReg(pParse, regRecord);
drh059b2d52014-10-24 19:28:09 +0000741 sqlite3ExprCachePop(pParse);
drh8b307fb2010-04-06 15:57:05 +0000742
743 /* Jump here when skipping the initialization */
744 sqlite3VdbeJumpHere(v, addrInit);
drh059b2d52014-10-24 19:28:09 +0000745
746end_auto_index_create:
747 sqlite3ExprDelete(pParse->db, pPartial);
drh8b307fb2010-04-06 15:57:05 +0000748}
drhc6339082010-04-07 16:54:58 +0000749#endif /* SQLITE_OMIT_AUTOMATIC_INDEX */
drh8b307fb2010-04-06 15:57:05 +0000750
drh9eff6162006-06-12 21:59:13 +0000751#ifndef SQLITE_OMIT_VIRTUALTABLE
752/*
danielk19771d461462009-04-21 09:02:45 +0000753** Allocate and populate an sqlite3_index_info structure. It is the
754** responsibility of the caller to eventually release the structure
755** by passing the pointer returned by this function to sqlite3_free().
756*/
drh5346e952013-05-08 14:14:26 +0000757static sqlite3_index_info *allocateIndexInfo(
758 Parse *pParse,
759 WhereClause *pWC,
dan4f20cd42015-06-08 18:05:54 +0000760 Bitmask mUnusable, /* Ignore terms with these prereqs */
drh5346e952013-05-08 14:14:26 +0000761 struct SrcList_item *pSrc,
762 ExprList *pOrderBy
763){
danielk19771d461462009-04-21 09:02:45 +0000764 int i, j;
765 int nTerm;
766 struct sqlite3_index_constraint *pIdxCons;
767 struct sqlite3_index_orderby *pIdxOrderBy;
768 struct sqlite3_index_constraint_usage *pUsage;
769 WhereTerm *pTerm;
770 int nOrderBy;
771 sqlite3_index_info *pIdxInfo;
772
danielk19771d461462009-04-21 09:02:45 +0000773 /* Count the number of possible WHERE clause constraints referring
774 ** to this virtual table */
775 for(i=nTerm=0, pTerm=pWC->a; i<pWC->nTerm; i++, pTerm++){
776 if( pTerm->leftCursor != pSrc->iCursor ) continue;
dan4f20cd42015-06-08 18:05:54 +0000777 if( pTerm->prereqRight & mUnusable ) continue;
drh7a5bcc02013-01-16 17:08:58 +0000778 assert( IsPowerOfTwo(pTerm->eOperator & ~WO_EQUIV) );
779 testcase( pTerm->eOperator & WO_IN );
780 testcase( pTerm->eOperator & WO_ISNULL );
drhee145872015-05-14 13:18:47 +0000781 testcase( pTerm->eOperator & WO_IS );
dana4ff8252014-01-20 19:55:33 +0000782 testcase( pTerm->eOperator & WO_ALL );
drhee145872015-05-14 13:18:47 +0000783 if( (pTerm->eOperator & ~(WO_ISNULL|WO_EQUIV|WO_IS))==0 ) continue;
drhb4256992011-08-02 01:57:39 +0000784 if( pTerm->wtFlags & TERM_VNULL ) continue;
danielk19771d461462009-04-21 09:02:45 +0000785 nTerm++;
786 }
787
788 /* If the ORDER BY clause contains only columns in the current
789 ** virtual table then allocate space for the aOrderBy part of
790 ** the sqlite3_index_info structure.
791 */
792 nOrderBy = 0;
793 if( pOrderBy ){
drh56f1b992012-09-25 14:29:39 +0000794 int n = pOrderBy->nExpr;
795 for(i=0; i<n; i++){
danielk19771d461462009-04-21 09:02:45 +0000796 Expr *pExpr = pOrderBy->a[i].pExpr;
797 if( pExpr->op!=TK_COLUMN || pExpr->iTable!=pSrc->iCursor ) break;
798 }
drh56f1b992012-09-25 14:29:39 +0000799 if( i==n){
800 nOrderBy = n;
danielk19771d461462009-04-21 09:02:45 +0000801 }
802 }
803
804 /* Allocate the sqlite3_index_info structure
805 */
806 pIdxInfo = sqlite3DbMallocZero(pParse->db, sizeof(*pIdxInfo)
807 + (sizeof(*pIdxCons) + sizeof(*pUsage))*nTerm
808 + sizeof(*pIdxOrderBy)*nOrderBy );
809 if( pIdxInfo==0 ){
810 sqlite3ErrorMsg(pParse, "out of memory");
danielk19771d461462009-04-21 09:02:45 +0000811 return 0;
812 }
813
814 /* Initialize the structure. The sqlite3_index_info structure contains
815 ** many fields that are declared "const" to prevent xBestIndex from
816 ** changing them. We have to do some funky casting in order to
817 ** initialize those fields.
818 */
819 pIdxCons = (struct sqlite3_index_constraint*)&pIdxInfo[1];
820 pIdxOrderBy = (struct sqlite3_index_orderby*)&pIdxCons[nTerm];
821 pUsage = (struct sqlite3_index_constraint_usage*)&pIdxOrderBy[nOrderBy];
822 *(int*)&pIdxInfo->nConstraint = nTerm;
823 *(int*)&pIdxInfo->nOrderBy = nOrderBy;
824 *(struct sqlite3_index_constraint**)&pIdxInfo->aConstraint = pIdxCons;
825 *(struct sqlite3_index_orderby**)&pIdxInfo->aOrderBy = pIdxOrderBy;
826 *(struct sqlite3_index_constraint_usage**)&pIdxInfo->aConstraintUsage =
827 pUsage;
828
829 for(i=j=0, pTerm=pWC->a; i<pWC->nTerm; i++, pTerm++){
drh281bbe22012-10-16 23:17:14 +0000830 u8 op;
danielk19771d461462009-04-21 09:02:45 +0000831 if( pTerm->leftCursor != pSrc->iCursor ) continue;
dan4f20cd42015-06-08 18:05:54 +0000832 if( pTerm->prereqRight & mUnusable ) continue;
drh7a5bcc02013-01-16 17:08:58 +0000833 assert( IsPowerOfTwo(pTerm->eOperator & ~WO_EQUIV) );
834 testcase( pTerm->eOperator & WO_IN );
drhee145872015-05-14 13:18:47 +0000835 testcase( pTerm->eOperator & WO_IS );
drh7a5bcc02013-01-16 17:08:58 +0000836 testcase( pTerm->eOperator & WO_ISNULL );
dana4ff8252014-01-20 19:55:33 +0000837 testcase( pTerm->eOperator & WO_ALL );
drhe8d0c612015-05-14 01:05:25 +0000838 if( (pTerm->eOperator & ~(WO_ISNULL|WO_EQUIV|WO_IS))==0 ) continue;
drhb4256992011-08-02 01:57:39 +0000839 if( pTerm->wtFlags & TERM_VNULL ) continue;
danielk19771d461462009-04-21 09:02:45 +0000840 pIdxCons[j].iColumn = pTerm->u.leftColumn;
841 pIdxCons[j].iTermOffset = i;
drh7a5bcc02013-01-16 17:08:58 +0000842 op = (u8)pTerm->eOperator & WO_ALL;
drh281bbe22012-10-16 23:17:14 +0000843 if( op==WO_IN ) op = WO_EQ;
844 pIdxCons[j].op = op;
danielk19771d461462009-04-21 09:02:45 +0000845 /* The direct assignment in the previous line is possible only because
846 ** the WO_ and SQLITE_INDEX_CONSTRAINT_ codes are identical. The
847 ** following asserts verify this fact. */
848 assert( WO_EQ==SQLITE_INDEX_CONSTRAINT_EQ );
849 assert( WO_LT==SQLITE_INDEX_CONSTRAINT_LT );
850 assert( WO_LE==SQLITE_INDEX_CONSTRAINT_LE );
851 assert( WO_GT==SQLITE_INDEX_CONSTRAINT_GT );
852 assert( WO_GE==SQLITE_INDEX_CONSTRAINT_GE );
853 assert( WO_MATCH==SQLITE_INDEX_CONSTRAINT_MATCH );
drh281bbe22012-10-16 23:17:14 +0000854 assert( pTerm->eOperator & (WO_IN|WO_EQ|WO_LT|WO_LE|WO_GT|WO_GE|WO_MATCH) );
danielk19771d461462009-04-21 09:02:45 +0000855 j++;
856 }
857 for(i=0; i<nOrderBy; i++){
858 Expr *pExpr = pOrderBy->a[i].pExpr;
859 pIdxOrderBy[i].iColumn = pExpr->iColumn;
860 pIdxOrderBy[i].desc = pOrderBy->a[i].sortOrder;
861 }
862
863 return pIdxInfo;
864}
865
866/*
867** The table object reference passed as the second argument to this function
868** must represent a virtual table. This function invokes the xBestIndex()
drh3b48e8c2013-06-12 20:18:16 +0000869** method of the virtual table with the sqlite3_index_info object that
870** comes in as the 3rd argument to this function.
danielk19771d461462009-04-21 09:02:45 +0000871**
872** If an error occurs, pParse is populated with an error message and a
873** non-zero value is returned. Otherwise, 0 is returned and the output
874** part of the sqlite3_index_info structure is left populated.
875**
876** Whether or not an error is returned, it is the responsibility of the
877** caller to eventually free p->idxStr if p->needToFreeIdxStr indicates
878** that this is required.
879*/
880static int vtabBestIndex(Parse *pParse, Table *pTab, sqlite3_index_info *p){
danielk1977595a5232009-07-24 17:58:53 +0000881 sqlite3_vtab *pVtab = sqlite3GetVTable(pParse->db, pTab)->pVtab;
danielk19771d461462009-04-21 09:02:45 +0000882 int i;
883 int rc;
884
danielk19771d461462009-04-21 09:02:45 +0000885 TRACE_IDX_INPUTS(p);
886 rc = pVtab->pModule->xBestIndex(pVtab, p);
887 TRACE_IDX_OUTPUTS(p);
danielk19771d461462009-04-21 09:02:45 +0000888
889 if( rc!=SQLITE_OK ){
890 if( rc==SQLITE_NOMEM ){
891 pParse->db->mallocFailed = 1;
892 }else if( !pVtab->zErrMsg ){
893 sqlite3ErrorMsg(pParse, "%s", sqlite3ErrStr(rc));
894 }else{
895 sqlite3ErrorMsg(pParse, "%s", pVtab->zErrMsg);
896 }
897 }
drhb9755982010-07-24 16:34:37 +0000898 sqlite3_free(pVtab->zErrMsg);
danielk19771d461462009-04-21 09:02:45 +0000899 pVtab->zErrMsg = 0;
900
901 for(i=0; i<p->nConstraint; i++){
902 if( !p->aConstraint[i].usable && p->aConstraintUsage[i].argvIndex>0 ){
903 sqlite3ErrorMsg(pParse,
904 "table %s: xBestIndex returned an invalid plan", pTab->zName);
905 }
906 }
907
908 return pParse->nErr;
909}
drh7ba39a92013-05-30 17:43:19 +0000910#endif /* !defined(SQLITE_OMIT_VIRTUALTABLE) */
danielk19771d461462009-04-21 09:02:45 +0000911
drh1435a9a2013-08-27 23:15:44 +0000912#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
drh28c4cf42005-07-27 20:41:43 +0000913/*
drhfaacf172011-08-12 01:51:45 +0000914** Estimate the location of a particular key among all keys in an
915** index. Store the results in aStat as follows:
drhe847d322011-01-20 02:56:37 +0000916**
dana3d0c132015-03-14 18:59:58 +0000917** aStat[0] Est. number of rows less than pRec
918** aStat[1] Est. number of rows equal to pRec
dan02fa4692009-08-17 17:06:58 +0000919**
drh6d3f91d2014-11-05 19:26:12 +0000920** Return the index of the sample that is the smallest sample that
dana3d0c132015-03-14 18:59:58 +0000921** is greater than or equal to pRec. Note that this index is not an index
922** into the aSample[] array - it is an index into a virtual set of samples
923** based on the contents of aSample[] and the number of fields in record
924** pRec.
dan02fa4692009-08-17 17:06:58 +0000925*/
drh6d3f91d2014-11-05 19:26:12 +0000926static int whereKeyStats(
dan02fa4692009-08-17 17:06:58 +0000927 Parse *pParse, /* Database connection */
928 Index *pIdx, /* Index to consider domain of */
dan7a419232013-08-06 20:01:43 +0000929 UnpackedRecord *pRec, /* Vector of values to consider */
drhfaacf172011-08-12 01:51:45 +0000930 int roundUp, /* Round up if true. Round down if false */
931 tRowcnt *aStat /* OUT: stats written here */
dan02fa4692009-08-17 17:06:58 +0000932){
danf52bb8d2013-08-03 20:24:58 +0000933 IndexSample *aSample = pIdx->aSample;
drhfbc38de2013-09-03 19:26:22 +0000934 int iCol; /* Index of required stats in anEq[] etc. */
dana3d0c132015-03-14 18:59:58 +0000935 int i; /* Index of first sample >= pRec */
936 int iSample; /* Smallest sample larger than or equal to pRec */
dan84c309b2013-08-08 16:17:12 +0000937 int iMin = 0; /* Smallest sample not yet tested */
dan84c309b2013-08-08 16:17:12 +0000938 int iTest; /* Next sample to test */
939 int res; /* Result of comparison operation */
dana3d0c132015-03-14 18:59:58 +0000940 int nField; /* Number of fields in pRec */
941 tRowcnt iLower = 0; /* anLt[] + anEq[] of largest sample pRec is > */
dan02fa4692009-08-17 17:06:58 +0000942
drh4f991892013-10-11 15:05:05 +0000943#ifndef SQLITE_DEBUG
944 UNUSED_PARAMETER( pParse );
945#endif
drh7f594752013-12-03 19:49:55 +0000946 assert( pRec!=0 );
drh5c624862011-09-22 18:46:34 +0000947 assert( pIdx->nSample>0 );
dana3d0c132015-03-14 18:59:58 +0000948 assert( pRec->nField>0 && pRec->nField<=pIdx->nSampleCol );
949
950 /* Do a binary search to find the first sample greater than or equal
951 ** to pRec. If pRec contains a single field, the set of samples to search
952 ** is simply the aSample[] array. If the samples in aSample[] contain more
953 ** than one fields, all fields following the first are ignored.
954 **
955 ** If pRec contains N fields, where N is more than one, then as well as the
956 ** samples in aSample[] (truncated to N fields), the search also has to
957 ** consider prefixes of those samples. For example, if the set of samples
958 ** in aSample is:
959 **
960 ** aSample[0] = (a, 5)
961 ** aSample[1] = (a, 10)
962 ** aSample[2] = (b, 5)
963 ** aSample[3] = (c, 100)
964 ** aSample[4] = (c, 105)
965 **
966 ** Then the search space should ideally be the samples above and the
967 ** unique prefixes [a], [b] and [c]. But since that is hard to organize,
968 ** the code actually searches this set:
969 **
970 ** 0: (a)
971 ** 1: (a, 5)
972 ** 2: (a, 10)
973 ** 3: (a, 10)
974 ** 4: (b)
975 ** 5: (b, 5)
976 ** 6: (c)
977 ** 7: (c, 100)
978 ** 8: (c, 105)
979 ** 9: (c, 105)
980 **
981 ** For each sample in the aSample[] array, N samples are present in the
982 ** effective sample array. In the above, samples 0 and 1 are based on
983 ** sample aSample[0]. Samples 2 and 3 on aSample[1] etc.
984 **
985 ** Often, sample i of each block of N effective samples has (i+1) fields.
986 ** Except, each sample may be extended to ensure that it is greater than or
987 ** equal to the previous sample in the array. For example, in the above,
988 ** sample 2 is the first sample of a block of N samples, so at first it
989 ** appears that it should be 1 field in size. However, that would make it
990 ** smaller than sample 1, so the binary search would not work. As a result,
991 ** it is extended to two fields. The duplicates that this creates do not
992 ** cause any problems.
993 */
994 nField = pRec->nField;
995 iCol = 0;
996 iSample = pIdx->nSample * nField;
dan84c309b2013-08-08 16:17:12 +0000997 do{
dana3d0c132015-03-14 18:59:58 +0000998 int iSamp; /* Index in aSample[] of test sample */
999 int n; /* Number of fields in test sample */
1000
1001 iTest = (iMin+iSample)/2;
1002 iSamp = iTest / nField;
1003 if( iSamp>0 ){
1004 /* The proposed effective sample is a prefix of sample aSample[iSamp].
1005 ** Specifically, the shortest prefix of at least (1 + iTest%nField)
1006 ** fields that is greater than the previous effective sample. */
1007 for(n=(iTest % nField) + 1; n<nField; n++){
1008 if( aSample[iSamp-1].anLt[n-1]!=aSample[iSamp].anLt[n-1] ) break;
1009 }
dan84c309b2013-08-08 16:17:12 +00001010 }else{
dana3d0c132015-03-14 18:59:58 +00001011 n = iTest + 1;
dan02fa4692009-08-17 17:06:58 +00001012 }
dana3d0c132015-03-14 18:59:58 +00001013
1014 pRec->nField = n;
1015 res = sqlite3VdbeRecordCompare(aSample[iSamp].n, aSample[iSamp].p, pRec);
1016 if( res<0 ){
1017 iLower = aSample[iSamp].anLt[n-1] + aSample[iSamp].anEq[n-1];
1018 iMin = iTest+1;
1019 }else if( res==0 && n<nField ){
1020 iLower = aSample[iSamp].anLt[n-1];
1021 iMin = iTest+1;
1022 res = -1;
1023 }else{
1024 iSample = iTest;
1025 iCol = n-1;
1026 }
1027 }while( res && iMin<iSample );
1028 i = iSample / nField;
drh51147ba2005-07-23 22:59:55 +00001029
dan84c309b2013-08-08 16:17:12 +00001030#ifdef SQLITE_DEBUG
1031 /* The following assert statements check that the binary search code
1032 ** above found the right answer. This block serves no purpose other
1033 ** than to invoke the asserts. */
dana3d0c132015-03-14 18:59:58 +00001034 if( pParse->db->mallocFailed==0 ){
1035 if( res==0 ){
1036 /* If (res==0) is true, then pRec must be equal to sample i. */
1037 assert( i<pIdx->nSample );
1038 assert( iCol==nField-1 );
1039 pRec->nField = nField;
1040 assert( 0==sqlite3VdbeRecordCompare(aSample[i].n, aSample[i].p, pRec)
1041 || pParse->db->mallocFailed
1042 );
1043 }else{
1044 /* Unless i==pIdx->nSample, indicating that pRec is larger than
1045 ** all samples in the aSample[] array, pRec must be smaller than the
1046 ** (iCol+1) field prefix of sample i. */
1047 assert( i<=pIdx->nSample && i>=0 );
1048 pRec->nField = iCol+1;
1049 assert( i==pIdx->nSample
1050 || sqlite3VdbeRecordCompare(aSample[i].n, aSample[i].p, pRec)>0
1051 || pParse->db->mallocFailed );
1052
1053 /* if i==0 and iCol==0, then record pRec is smaller than all samples
1054 ** in the aSample[] array. Otherwise, if (iCol>0) then pRec must
1055 ** be greater than or equal to the (iCol) field prefix of sample i.
1056 ** If (i>0), then pRec must also be greater than sample (i-1). */
1057 if( iCol>0 ){
1058 pRec->nField = iCol;
1059 assert( sqlite3VdbeRecordCompare(aSample[i].n, aSample[i].p, pRec)<=0
1060 || pParse->db->mallocFailed );
1061 }
1062 if( i>0 ){
1063 pRec->nField = nField;
1064 assert( sqlite3VdbeRecordCompare(aSample[i-1].n, aSample[i-1].p, pRec)<0
1065 || pParse->db->mallocFailed );
1066 }
1067 }
drhfaacf172011-08-12 01:51:45 +00001068 }
dan84c309b2013-08-08 16:17:12 +00001069#endif /* ifdef SQLITE_DEBUG */
dan02fa4692009-08-17 17:06:58 +00001070
dan84c309b2013-08-08 16:17:12 +00001071 if( res==0 ){
dana3d0c132015-03-14 18:59:58 +00001072 /* Record pRec is equal to sample i */
1073 assert( iCol==nField-1 );
daneea568d2013-08-07 19:46:15 +00001074 aStat[0] = aSample[i].anLt[iCol];
1075 aStat[1] = aSample[i].anEq[iCol];
drhfaacf172011-08-12 01:51:45 +00001076 }else{
dana3d0c132015-03-14 18:59:58 +00001077 /* At this point, the (iCol+1) field prefix of aSample[i] is the first
1078 ** sample that is greater than pRec. Or, if i==pIdx->nSample then pRec
1079 ** is larger than all samples in the array. */
1080 tRowcnt iUpper, iGap;
1081 if( i>=pIdx->nSample ){
1082 iUpper = sqlite3LogEstToInt(pIdx->aiRowLogEst[0]);
drhfaacf172011-08-12 01:51:45 +00001083 }else{
dana3d0c132015-03-14 18:59:58 +00001084 iUpper = aSample[i].anLt[iCol];
drhfaacf172011-08-12 01:51:45 +00001085 }
dana3d0c132015-03-14 18:59:58 +00001086
drhfaacf172011-08-12 01:51:45 +00001087 if( iLower>=iUpper ){
1088 iGap = 0;
1089 }else{
1090 iGap = iUpper - iLower;
drhfaacf172011-08-12 01:51:45 +00001091 }
1092 if( roundUp ){
1093 iGap = (iGap*2)/3;
1094 }else{
1095 iGap = iGap/3;
1096 }
1097 aStat[0] = iLower + iGap;
dana3d0c132015-03-14 18:59:58 +00001098 aStat[1] = pIdx->aAvgEq[iCol];
dan02fa4692009-08-17 17:06:58 +00001099 }
dana3d0c132015-03-14 18:59:58 +00001100
1101 /* Restore the pRec->nField value before returning. */
1102 pRec->nField = nField;
drh6d3f91d2014-11-05 19:26:12 +00001103 return i;
dan02fa4692009-08-17 17:06:58 +00001104}
drh1435a9a2013-08-27 23:15:44 +00001105#endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */
dan937d0de2009-10-15 18:35:38 +00001106
1107/*
danaa9933c2014-04-24 20:04:49 +00001108** If it is not NULL, pTerm is a term that provides an upper or lower
1109** bound on a range scan. Without considering pTerm, it is estimated
1110** that the scan will visit nNew rows. This function returns the number
1111** estimated to be visited after taking pTerm into account.
1112**
1113** If the user explicitly specified a likelihood() value for this term,
1114** then the return value is the likelihood multiplied by the number of
1115** input rows. Otherwise, this function assumes that an "IS NOT NULL" term
1116** has a likelihood of 0.50, and any other term a likelihood of 0.25.
1117*/
1118static LogEst whereRangeAdjust(WhereTerm *pTerm, LogEst nNew){
1119 LogEst nRet = nNew;
1120 if( pTerm ){
1121 if( pTerm->truthProb<=0 ){
1122 nRet += pTerm->truthProb;
dan7de2a1f2014-04-28 20:11:20 +00001123 }else if( (pTerm->wtFlags & TERM_VNULL)==0 ){
danaa9933c2014-04-24 20:04:49 +00001124 nRet -= 20; assert( 20==sqlite3LogEst(4) );
1125 }
1126 }
1127 return nRet;
1128}
1129
mistachkin2d84ac42014-06-26 21:32:09 +00001130#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
danb0b82902014-06-26 20:21:46 +00001131/*
1132** This function is called to estimate the number of rows visited by a
1133** range-scan on a skip-scan index. For example:
1134**
1135** CREATE INDEX i1 ON t1(a, b, c);
1136** SELECT * FROM t1 WHERE a=? AND c BETWEEN ? AND ?;
1137**
1138** Value pLoop->nOut is currently set to the estimated number of rows
1139** visited for scanning (a=? AND b=?). This function reduces that estimate
1140** by some factor to account for the (c BETWEEN ? AND ?) expression based
1141** on the stat4 data for the index. this scan will be peformed multiple
1142** times (once for each (a,b) combination that matches a=?) is dealt with
1143** by the caller.
1144**
1145** It does this by scanning through all stat4 samples, comparing values
1146** extracted from pLower and pUpper with the corresponding column in each
1147** sample. If L and U are the number of samples found to be less than or
1148** equal to the values extracted from pLower and pUpper respectively, and
1149** N is the total number of samples, the pLoop->nOut value is adjusted
1150** as follows:
1151**
1152** nOut = nOut * ( min(U - L, 1) / N )
1153**
1154** If pLower is NULL, or a value cannot be extracted from the term, L is
1155** set to zero. If pUpper is NULL, or a value cannot be extracted from it,
1156** U is set to N.
1157**
1158** Normally, this function sets *pbDone to 1 before returning. However,
1159** if no value can be extracted from either pLower or pUpper (and so the
1160** estimate of the number of rows delivered remains unchanged), *pbDone
1161** is left as is.
1162**
1163** If an error occurs, an SQLite error code is returned. Otherwise,
1164** SQLITE_OK.
1165*/
1166static int whereRangeSkipScanEst(
1167 Parse *pParse, /* Parsing & code generating context */
1168 WhereTerm *pLower, /* Lower bound on the range. ex: "x>123" Might be NULL */
1169 WhereTerm *pUpper, /* Upper bound on the range. ex: "x<455" Might be NULL */
1170 WhereLoop *pLoop, /* Update the .nOut value of this loop */
1171 int *pbDone /* Set to true if at least one expr. value extracted */
1172){
1173 Index *p = pLoop->u.btree.pIndex;
1174 int nEq = pLoop->u.btree.nEq;
1175 sqlite3 *db = pParse->db;
dan4e42ba42014-06-27 20:14:25 +00001176 int nLower = -1;
1177 int nUpper = p->nSample+1;
danb0b82902014-06-26 20:21:46 +00001178 int rc = SQLITE_OK;
drhd15f87e2014-07-24 22:41:20 +00001179 int iCol = p->aiColumn[nEq];
1180 u8 aff = iCol>=0 ? p->pTable->aCol[iCol].affinity : SQLITE_AFF_INTEGER;
danb0b82902014-06-26 20:21:46 +00001181 CollSeq *pColl;
1182
1183 sqlite3_value *p1 = 0; /* Value extracted from pLower */
1184 sqlite3_value *p2 = 0; /* Value extracted from pUpper */
1185 sqlite3_value *pVal = 0; /* Value extracted from record */
1186
1187 pColl = sqlite3LocateCollSeq(pParse, p->azColl[nEq]);
1188 if( pLower ){
1189 rc = sqlite3Stat4ValueFromExpr(pParse, pLower->pExpr->pRight, aff, &p1);
dan4e42ba42014-06-27 20:14:25 +00001190 nLower = 0;
danb0b82902014-06-26 20:21:46 +00001191 }
1192 if( pUpper && rc==SQLITE_OK ){
1193 rc = sqlite3Stat4ValueFromExpr(pParse, pUpper->pExpr->pRight, aff, &p2);
dan4e42ba42014-06-27 20:14:25 +00001194 nUpper = p2 ? 0 : p->nSample;
danb0b82902014-06-26 20:21:46 +00001195 }
1196
1197 if( p1 || p2 ){
1198 int i;
1199 int nDiff;
1200 for(i=0; rc==SQLITE_OK && i<p->nSample; i++){
1201 rc = sqlite3Stat4Column(db, p->aSample[i].p, p->aSample[i].n, nEq, &pVal);
1202 if( rc==SQLITE_OK && p1 ){
1203 int res = sqlite3MemCompare(p1, pVal, pColl);
dan4e42ba42014-06-27 20:14:25 +00001204 if( res>=0 ) nLower++;
danb0b82902014-06-26 20:21:46 +00001205 }
1206 if( rc==SQLITE_OK && p2 ){
1207 int res = sqlite3MemCompare(p2, pVal, pColl);
dan4e42ba42014-06-27 20:14:25 +00001208 if( res>=0 ) nUpper++;
danb0b82902014-06-26 20:21:46 +00001209 }
1210 }
danb0b82902014-06-26 20:21:46 +00001211 nDiff = (nUpper - nLower);
1212 if( nDiff<=0 ) nDiff = 1;
dan4e42ba42014-06-27 20:14:25 +00001213
1214 /* If there is both an upper and lower bound specified, and the
1215 ** comparisons indicate that they are close together, use the fallback
1216 ** method (assume that the scan visits 1/64 of the rows) for estimating
1217 ** the number of rows visited. Otherwise, estimate the number of rows
1218 ** using the method described in the header comment for this function. */
1219 if( nDiff!=1 || pUpper==0 || pLower==0 ){
1220 int nAdjust = (sqlite3LogEst(p->nSample) - sqlite3LogEst(nDiff));
1221 pLoop->nOut -= nAdjust;
1222 *pbDone = 1;
1223 WHERETRACE(0x10, ("range skip-scan regions: %u..%u adjust=%d est=%d\n",
danfa887452014-06-28 15:26:10 +00001224 nLower, nUpper, nAdjust*-1, pLoop->nOut));
dan4e42ba42014-06-27 20:14:25 +00001225 }
1226
danb0b82902014-06-26 20:21:46 +00001227 }else{
1228 assert( *pbDone==0 );
1229 }
1230
1231 sqlite3ValueFree(p1);
1232 sqlite3ValueFree(p2);
1233 sqlite3ValueFree(pVal);
1234
1235 return rc;
1236}
mistachkin2d84ac42014-06-26 21:32:09 +00001237#endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */
danb0b82902014-06-26 20:21:46 +00001238
danaa9933c2014-04-24 20:04:49 +00001239/*
dan02fa4692009-08-17 17:06:58 +00001240** This function is used to estimate the number of rows that will be visited
1241** by scanning an index for a range of values. The range may have an upper
1242** bound, a lower bound, or both. The WHERE clause terms that set the upper
1243** and lower bounds are represented by pLower and pUpper respectively. For
1244** example, assuming that index p is on t1(a):
1245**
1246** ... FROM t1 WHERE a > ? AND a < ? ...
1247** |_____| |_____|
1248** | |
1249** pLower pUpper
1250**
drh98cdf622009-08-20 18:14:42 +00001251** If either of the upper or lower bound is not present, then NULL is passed in
drhcdaca552009-08-20 13:45:07 +00001252** place of the corresponding WhereTerm.
dan02fa4692009-08-17 17:06:58 +00001253**
drh6d3f91d2014-11-05 19:26:12 +00001254** The value in (pBuilder->pNew->u.btree.nEq) is the number of the index
dan6cb8d762013-08-08 11:48:57 +00001255** column subject to the range constraint. Or, equivalently, the number of
1256** equality constraints optimized by the proposed index scan. For example,
1257** assuming index p is on t1(a, b), and the SQL query is:
dan02fa4692009-08-17 17:06:58 +00001258**
1259** ... FROM t1 WHERE a = ? AND b > ? AND b < ? ...
1260**
dan6cb8d762013-08-08 11:48:57 +00001261** then nEq is set to 1 (as the range restricted column, b, is the second
1262** left-most column of the index). Or, if the query is:
dan02fa4692009-08-17 17:06:58 +00001263**
1264** ... FROM t1 WHERE a > ? AND a < ? ...
1265**
dan6cb8d762013-08-08 11:48:57 +00001266** then nEq is set to 0.
dan02fa4692009-08-17 17:06:58 +00001267**
drhbf539c42013-10-05 18:16:02 +00001268** When this function is called, *pnOut is set to the sqlite3LogEst() of the
dan6cb8d762013-08-08 11:48:57 +00001269** number of rows that the index scan is expected to visit without
drh6d3f91d2014-11-05 19:26:12 +00001270** considering the range constraints. If nEq is 0, then *pnOut is the number of
dan6cb8d762013-08-08 11:48:57 +00001271** rows in the index. Assuming no error occurs, *pnOut is adjusted (reduced)
peter.d.reid60ec9142014-09-06 16:39:46 +00001272** to account for the range constraints pLower and pUpper.
dan6cb8d762013-08-08 11:48:57 +00001273**
** In the absence of sqlite_stat4 ANALYZE data, or if such data cannot be
** used, a single range inequality reduces the search space by a factor of 4,
** and a pair of constraints (x>? AND x<?) reduces the expected number of
** rows visited by a factor of 64.
dan02fa4692009-08-17 17:06:58 +00001278*/
1279static int whereRangeScanEst(
drhcdaca552009-08-20 13:45:07 +00001280 Parse *pParse, /* Parsing & code generating context */
dan7a419232013-08-06 20:01:43 +00001281 WhereLoopBuilder *pBuilder,
drhcdaca552009-08-20 13:45:07 +00001282 WhereTerm *pLower, /* Lower bound on the range. ex: "x>123" Might be NULL */
1283 WhereTerm *pUpper, /* Upper bound on the range. ex: "x<455" Might be NULL */
drh186ad8c2013-10-08 18:40:37 +00001284 WhereLoop *pLoop /* Modify the .nOut and maybe .rRun fields */
dan02fa4692009-08-17 17:06:58 +00001285){
dan69188d92009-08-19 08:18:32 +00001286 int rc = SQLITE_OK;
drh186ad8c2013-10-08 18:40:37 +00001287 int nOut = pLoop->nOut;
drhbf539c42013-10-05 18:16:02 +00001288 LogEst nNew;
dan69188d92009-08-19 08:18:32 +00001289
drh1435a9a2013-08-27 23:15:44 +00001290#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
drh186ad8c2013-10-08 18:40:37 +00001291 Index *p = pLoop->u.btree.pIndex;
drh4f991892013-10-11 15:05:05 +00001292 int nEq = pLoop->u.btree.nEq;
dan02fa4692009-08-17 17:06:58 +00001293
drh6d3f91d2014-11-05 19:26:12 +00001294 if( p->nSample>0 && nEq<p->nSampleCol ){
danb0b82902014-06-26 20:21:46 +00001295 if( nEq==pBuilder->nRecValid ){
1296 UnpackedRecord *pRec = pBuilder->pRec;
1297 tRowcnt a[2];
1298 u8 aff;
drh98cdf622009-08-20 18:14:42 +00001299
danb0b82902014-06-26 20:21:46 +00001300 /* Variable iLower will be set to the estimate of the number of rows in
1301 ** the index that are less than the lower bound of the range query. The
1302 ** lower bound being the concatenation of $P and $L, where $P is the
1303 ** key-prefix formed by the nEq values matched against the nEq left-most
1304 ** columns of the index, and $L is the value in pLower.
1305 **
1306 ** Or, if pLower is NULL or $L cannot be extracted from it (because it
1307 ** is not a simple variable or literal value), the lower bound of the
1308 ** range is $P. Due to a quirk in the way whereKeyStats() works, even
1309 ** if $L is available, whereKeyStats() is called for both ($P) and
drh6d3f91d2014-11-05 19:26:12 +00001310 ** ($P:$L) and the larger of the two returned values is used.
danb0b82902014-06-26 20:21:46 +00001311 **
1312 ** Similarly, iUpper is to be set to the estimate of the number of rows
1313 ** less than the upper bound of the range query. Where the upper bound
1314 ** is either ($P) or ($P:$U). Again, even if $U is available, both values
1315 ** of iUpper are requested of whereKeyStats() and the smaller used.
drh6d3f91d2014-11-05 19:26:12 +00001316 **
1317 ** The number of rows between the two bounds is then just iUpper-iLower.
danb0b82902014-06-26 20:21:46 +00001318 */
drh6d3f91d2014-11-05 19:26:12 +00001319 tRowcnt iLower; /* Rows less than the lower bound */
1320 tRowcnt iUpper; /* Rows less than the upper bound */
1321 int iLwrIdx = -2; /* aSample[] for the lower bound */
1322 int iUprIdx = -1; /* aSample[] for the upper bound */
danb3c02e22013-08-08 19:38:40 +00001323
drhb34fc5b2014-08-28 17:20:37 +00001324 if( pRec ){
1325 testcase( pRec->nField!=pBuilder->nRecValid );
1326 pRec->nField = pBuilder->nRecValid;
1327 }
danb0b82902014-06-26 20:21:46 +00001328 if( nEq==p->nKeyCol ){
1329 aff = SQLITE_AFF_INTEGER;
dan7a419232013-08-06 20:01:43 +00001330 }else{
danb0b82902014-06-26 20:21:46 +00001331 aff = p->pTable->aCol[p->aiColumn[nEq]].affinity;
drhfaacf172011-08-12 01:51:45 +00001332 }
danb0b82902014-06-26 20:21:46 +00001333 /* Determine iLower and iUpper using ($P) only. */
1334 if( nEq==0 ){
1335 iLower = 0;
drh9f07cf72014-10-22 15:27:05 +00001336 iUpper = p->nRowEst0;
danb0b82902014-06-26 20:21:46 +00001337 }else{
1338 /* Note: this call could be optimized away - since the same values must
1339 ** have been requested when testing key $P in whereEqualScanEst(). */
1340 whereKeyStats(pParse, p, pRec, 0, a);
1341 iLower = a[0];
1342 iUpper = a[0] + a[1];
dan6cb8d762013-08-08 11:48:57 +00001343 }
danb0b82902014-06-26 20:21:46 +00001344
drh69afd992014-10-08 02:53:25 +00001345 assert( pLower==0 || (pLower->eOperator & (WO_GT|WO_GE))!=0 );
1346 assert( pUpper==0 || (pUpper->eOperator & (WO_LT|WO_LE))!=0 );
drh681fca02014-10-10 15:01:46 +00001347 assert( p->aSortOrder!=0 );
1348 if( p->aSortOrder[nEq] ){
drh69afd992014-10-08 02:53:25 +00001349 /* The roles of pLower and pUpper are swapped for a DESC index */
1350 SWAP(WhereTerm*, pLower, pUpper);
1351 }
1352
danb0b82902014-06-26 20:21:46 +00001353 /* If possible, improve on the iLower estimate using ($P:$L). */
1354 if( pLower ){
1355 int bOk; /* True if value is extracted from pExpr */
1356 Expr *pExpr = pLower->pExpr->pRight;
danb0b82902014-06-26 20:21:46 +00001357 rc = sqlite3Stat4ProbeSetValue(pParse, p, &pRec, pExpr, aff, nEq, &bOk);
1358 if( rc==SQLITE_OK && bOk ){
1359 tRowcnt iNew;
drh6d3f91d2014-11-05 19:26:12 +00001360 iLwrIdx = whereKeyStats(pParse, p, pRec, 0, a);
drh69afd992014-10-08 02:53:25 +00001361 iNew = a[0] + ((pLower->eOperator & (WO_GT|WO_LE)) ? a[1] : 0);
danb0b82902014-06-26 20:21:46 +00001362 if( iNew>iLower ) iLower = iNew;
1363 nOut--;
danf741e042014-08-25 18:29:38 +00001364 pLower = 0;
danb0b82902014-06-26 20:21:46 +00001365 }
1366 }
1367
1368 /* If possible, improve on the iUpper estimate using ($P:$U). */
1369 if( pUpper ){
1370 int bOk; /* True if value is extracted from pExpr */
1371 Expr *pExpr = pUpper->pExpr->pRight;
danb0b82902014-06-26 20:21:46 +00001372 rc = sqlite3Stat4ProbeSetValue(pParse, p, &pRec, pExpr, aff, nEq, &bOk);
1373 if( rc==SQLITE_OK && bOk ){
1374 tRowcnt iNew;
drh6d3f91d2014-11-05 19:26:12 +00001375 iUprIdx = whereKeyStats(pParse, p, pRec, 1, a);
drh69afd992014-10-08 02:53:25 +00001376 iNew = a[0] + ((pUpper->eOperator & (WO_GT|WO_LE)) ? a[1] : 0);
danb0b82902014-06-26 20:21:46 +00001377 if( iNew<iUpper ) iUpper = iNew;
1378 nOut--;
danf741e042014-08-25 18:29:38 +00001379 pUpper = 0;
danb0b82902014-06-26 20:21:46 +00001380 }
1381 }
1382
1383 pBuilder->pRec = pRec;
1384 if( rc==SQLITE_OK ){
1385 if( iUpper>iLower ){
1386 nNew = sqlite3LogEst(iUpper - iLower);
drh6d3f91d2014-11-05 19:26:12 +00001387 /* TUNING: If both iUpper and iLower are derived from the same
1388 ** sample, then assume they are 4x more selective. This brings
1389 ** the estimated selectivity more in line with what it would be
1390 ** if estimated without the use of STAT3/4 tables. */
1391 if( iLwrIdx==iUprIdx ) nNew -= 20; assert( 20==sqlite3LogEst(4) );
danb0b82902014-06-26 20:21:46 +00001392 }else{
1393 nNew = 10; assert( 10==sqlite3LogEst(2) );
1394 }
1395 if( nNew<nOut ){
1396 nOut = nNew;
1397 }
drhae914d72014-08-28 19:38:22 +00001398 WHERETRACE(0x10, ("STAT4 range scan: %u..%u est=%d\n",
danb0b82902014-06-26 20:21:46 +00001399 (u32)iLower, (u32)iUpper, nOut));
danb0b82902014-06-26 20:21:46 +00001400 }
1401 }else{
1402 int bDone = 0;
1403 rc = whereRangeSkipScanEst(pParse, pLower, pUpper, pLoop, &bDone);
1404 if( bDone ) return rc;
drh98cdf622009-08-20 18:14:42 +00001405 }
dan02fa4692009-08-17 17:06:58 +00001406 }
drh3f022182009-09-09 16:10:50 +00001407#else
1408 UNUSED_PARAMETER(pParse);
dan7a419232013-08-06 20:01:43 +00001409 UNUSED_PARAMETER(pBuilder);
dan02fa4692009-08-17 17:06:58 +00001410 assert( pLower || pUpper );
danf741e042014-08-25 18:29:38 +00001411#endif
dan7de2a1f2014-04-28 20:11:20 +00001412 assert( pUpper==0 || (pUpper->wtFlags & TERM_VNULL)==0 );
danaa9933c2014-04-24 20:04:49 +00001413 nNew = whereRangeAdjust(pLower, nOut);
1414 nNew = whereRangeAdjust(pUpper, nNew);
dan7de2a1f2014-04-28 20:11:20 +00001415
drh4dd96a82014-10-24 15:26:29 +00001416 /* TUNING: If there is both an upper and lower limit and neither limit
1417 ** has an application-defined likelihood(), assume the range is
dan42685f22014-04-28 19:34:06 +00001418 ** reduced by an additional 75%. This means that, by default, an open-ended
1419 ** range query (e.g. col > ?) is assumed to match 1/4 of the rows in the
1420 ** index. While a closed range (e.g. col BETWEEN ? AND ?) is estimated to
1421 ** match 1/64 of the index. */
drh4dd96a82014-10-24 15:26:29 +00001422 if( pLower && pLower->truthProb>0 && pUpper && pUpper->truthProb>0 ){
1423 nNew -= 20;
1424 }
dan7de2a1f2014-04-28 20:11:20 +00001425
danaa9933c2014-04-24 20:04:49 +00001426 nOut -= (pLower!=0) + (pUpper!=0);
drhabfa6d52013-09-11 03:53:22 +00001427 if( nNew<10 ) nNew = 10;
1428 if( nNew<nOut ) nOut = nNew;
drhae914d72014-08-28 19:38:22 +00001429#if defined(WHERETRACE_ENABLED)
1430 if( pLoop->nOut>nOut ){
1431 WHERETRACE(0x10,("Range scan lowers nOut from %d to %d\n",
1432 pLoop->nOut, nOut));
1433 }
1434#endif
drh186ad8c2013-10-08 18:40:37 +00001435 pLoop->nOut = (LogEst)nOut;
dan02fa4692009-08-17 17:06:58 +00001436 return rc;
1437}
1438
drh1435a9a2013-08-27 23:15:44 +00001439#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
drh82759752011-01-20 16:52:09 +00001440/*
1441** Estimate the number of rows that will be returned based on
1442** an equality constraint x=VALUE and where that VALUE occurs in
1443** the histogram data. This only works when x is the left-most
drhfaacf172011-08-12 01:51:45 +00001444** column of an index and sqlite_stat3 histogram data is available
drhac8eb112011-03-17 01:58:21 +00001445** for that index. When pExpr==NULL that means the constraint is
1446** "x IS NULL" instead of "x=VALUE".
drh82759752011-01-20 16:52:09 +00001447**
drh0c50fa02011-01-21 16:27:18 +00001448** Write the estimated row count into *pnRow and return SQLITE_OK.
1449** If unable to make an estimate, leave *pnRow unchanged and return
1450** non-zero.
drh9b3eb0a2011-01-21 14:37:04 +00001451**
1452** This routine can fail if it is unable to load a collating sequence
1453** required for string comparison, or if unable to allocate memory
1454** for a UTF conversion required for comparison. The error is stored
1455** in the pParse structure.
drh82759752011-01-20 16:52:09 +00001456*/
drh041e09f2011-04-07 19:56:21 +00001457static int whereEqualScanEst(
drh82759752011-01-20 16:52:09 +00001458 Parse *pParse, /* Parsing & code generating context */
dan7a419232013-08-06 20:01:43 +00001459 WhereLoopBuilder *pBuilder,
drh0c50fa02011-01-21 16:27:18 +00001460 Expr *pExpr, /* Expression for VALUE in the x=VALUE constraint */
drhb8a8e8a2013-06-10 19:12:39 +00001461 tRowcnt *pnRow /* Write the revised row estimate here */
drh82759752011-01-20 16:52:09 +00001462){
dan7a419232013-08-06 20:01:43 +00001463 Index *p = pBuilder->pNew->u.btree.pIndex;
1464 int nEq = pBuilder->pNew->u.btree.nEq;
1465 UnpackedRecord *pRec = pBuilder->pRec;
drh82759752011-01-20 16:52:09 +00001466 u8 aff; /* Column affinity */
1467 int rc; /* Subfunction return code */
drhfaacf172011-08-12 01:51:45 +00001468 tRowcnt a[2]; /* Statistics */
dan7a419232013-08-06 20:01:43 +00001469 int bOk;
drh82759752011-01-20 16:52:09 +00001470
dan7a419232013-08-06 20:01:43 +00001471 assert( nEq>=1 );
danfd984b82014-06-30 18:02:20 +00001472 assert( nEq<=p->nColumn );
drh82759752011-01-20 16:52:09 +00001473 assert( p->aSample!=0 );
drh5c624862011-09-22 18:46:34 +00001474 assert( p->nSample>0 );
dan7a419232013-08-06 20:01:43 +00001475 assert( pBuilder->nRecValid<nEq );
1476
1477 /* If values are not available for all fields of the index to the left
1478 ** of this one, no estimate can be made. Return SQLITE_NOTFOUND. */
1479 if( pBuilder->nRecValid<(nEq-1) ){
1480 return SQLITE_NOTFOUND;
drh1f9c7662011-03-17 01:34:26 +00001481 }
dan7a419232013-08-06 20:01:43 +00001482
dandd6e1f12013-08-10 19:08:30 +00001483 /* This is an optimization only. The call to sqlite3Stat4ProbeSetValue()
1484 ** below would return the same value. */
danfd984b82014-06-30 18:02:20 +00001485 if( nEq>=p->nColumn ){
dan7a419232013-08-06 20:01:43 +00001486 *pnRow = 1;
1487 return SQLITE_OK;
drh82759752011-01-20 16:52:09 +00001488 }
dan7a419232013-08-06 20:01:43 +00001489
daneea568d2013-08-07 19:46:15 +00001490 aff = p->pTable->aCol[p->aiColumn[nEq-1]].affinity;
dan87cd9322013-08-07 15:52:41 +00001491 rc = sqlite3Stat4ProbeSetValue(pParse, p, &pRec, pExpr, aff, nEq-1, &bOk);
1492 pBuilder->pRec = pRec;
dan7a419232013-08-06 20:01:43 +00001493 if( rc!=SQLITE_OK ) return rc;
1494 if( bOk==0 ) return SQLITE_NOTFOUND;
dan7a419232013-08-06 20:01:43 +00001495 pBuilder->nRecValid = nEq;
dan7a419232013-08-06 20:01:43 +00001496
danb3c02e22013-08-08 19:38:40 +00001497 whereKeyStats(pParse, p, pRec, 0, a);
drh989578e2013-10-28 14:34:35 +00001498 WHERETRACE(0x10,("equality scan regions: %d\n", (int)a[1]));
danb3c02e22013-08-08 19:38:40 +00001499 *pnRow = a[1];
daneea568d2013-08-07 19:46:15 +00001500
drh0c50fa02011-01-21 16:27:18 +00001501 return rc;
1502}
drh1435a9a2013-08-27 23:15:44 +00001503#endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */
drh0c50fa02011-01-21 16:27:18 +00001504
drh1435a9a2013-08-27 23:15:44 +00001505#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
drh0c50fa02011-01-21 16:27:18 +00001506/*
1507** Estimate the number of rows that will be returned based on
drh5ac06072011-01-21 18:18:13 +00001508** an IN constraint where the right-hand side of the IN operator
1509** is a list of values. Example:
1510**
1511** WHERE x IN (1,2,3,4)
drh0c50fa02011-01-21 16:27:18 +00001512**
1513** Write the estimated row count into *pnRow and return SQLITE_OK.
1514** If unable to make an estimate, leave *pnRow unchanged and return
1515** non-zero.
1516**
1517** This routine can fail if it is unable to load a collating sequence
1518** required for string comparison, or if unable to allocate memory
1519** for a UTF conversion required for comparison. The error is stored
1520** in the pParse structure.
1521*/
drh041e09f2011-04-07 19:56:21 +00001522static int whereInScanEst(
drh0c50fa02011-01-21 16:27:18 +00001523 Parse *pParse, /* Parsing & code generating context */
dan7a419232013-08-06 20:01:43 +00001524 WhereLoopBuilder *pBuilder,
drh0c50fa02011-01-21 16:27:18 +00001525 ExprList *pList, /* The value list on the RHS of "x IN (v1,v2,v3,...)" */
drhb8a8e8a2013-06-10 19:12:39 +00001526 tRowcnt *pnRow /* Write the revised row estimate here */
drh0c50fa02011-01-21 16:27:18 +00001527){
dan7a419232013-08-06 20:01:43 +00001528 Index *p = pBuilder->pNew->u.btree.pIndex;
dancfc9df72014-04-25 15:01:01 +00001529 i64 nRow0 = sqlite3LogEstToInt(p->aiRowLogEst[0]);
dan7a419232013-08-06 20:01:43 +00001530 int nRecValid = pBuilder->nRecValid;
drhb8a8e8a2013-06-10 19:12:39 +00001531 int rc = SQLITE_OK; /* Subfunction return code */
1532 tRowcnt nEst; /* Number of rows for a single term */
1533 tRowcnt nRowEst = 0; /* New estimate of the number of rows */
1534 int i; /* Loop counter */
drh0c50fa02011-01-21 16:27:18 +00001535
1536 assert( p->aSample!=0 );
drhfaacf172011-08-12 01:51:45 +00001537 for(i=0; rc==SQLITE_OK && i<pList->nExpr; i++){
dancfc9df72014-04-25 15:01:01 +00001538 nEst = nRow0;
dan7a419232013-08-06 20:01:43 +00001539 rc = whereEqualScanEst(pParse, pBuilder, pList->a[i].pExpr, &nEst);
drhfaacf172011-08-12 01:51:45 +00001540 nRowEst += nEst;
dan7a419232013-08-06 20:01:43 +00001541 pBuilder->nRecValid = nRecValid;
drh0c50fa02011-01-21 16:27:18 +00001542 }
dan7a419232013-08-06 20:01:43 +00001543
drh0c50fa02011-01-21 16:27:18 +00001544 if( rc==SQLITE_OK ){
dancfc9df72014-04-25 15:01:01 +00001545 if( nRowEst > nRow0 ) nRowEst = nRow0;
drh0c50fa02011-01-21 16:27:18 +00001546 *pnRow = nRowEst;
drh5418b122014-08-28 13:42:13 +00001547 WHERETRACE(0x10,("IN row estimate: est=%d\n", nRowEst));
drh0c50fa02011-01-21 16:27:18 +00001548 }
dan7a419232013-08-06 20:01:43 +00001549 assert( pBuilder->nRecValid==nRecValid );
drh0c50fa02011-01-21 16:27:18 +00001550 return rc;
drh82759752011-01-20 16:52:09 +00001551}
drh1435a9a2013-08-27 23:15:44 +00001552#endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */
drh82759752011-01-20 16:52:09 +00001553
drh111a6a72008-12-21 03:51:16 +00001554
drhd15cb172013-05-21 19:23:10 +00001555#ifdef WHERETRACE_ENABLED
drha18f3d22013-05-08 03:05:41 +00001556/*
drhc90713d2014-09-30 13:46:49 +00001557** Print the content of a WhereTerm object
1558*/
1559static void whereTermPrint(WhereTerm *pTerm, int iTerm){
drh0a99ba32014-09-30 17:03:35 +00001560 if( pTerm==0 ){
1561 sqlite3DebugPrintf("TERM-%-3d NULL\n", iTerm);
1562 }else{
1563 char zType[4];
1564 memcpy(zType, "...", 4);
1565 if( pTerm->wtFlags & TERM_VIRTUAL ) zType[0] = 'V';
1566 if( pTerm->eOperator & WO_EQUIV ) zType[1] = 'E';
1567 if( ExprHasProperty(pTerm->pExpr, EP_FromJoin) ) zType[2] = 'L';
drhfcd49532015-05-13 15:24:07 +00001568 sqlite3DebugPrintf(
1569 "TERM-%-3d %p %s cursor=%-3d prob=%-3d op=0x%03x wtFlags=0x%04x\n",
1570 iTerm, pTerm, zType, pTerm->leftCursor, pTerm->truthProb,
1571 pTerm->eOperator, pTerm->wtFlags);
drh0a99ba32014-09-30 17:03:35 +00001572 sqlite3TreeViewExpr(0, pTerm->pExpr, 0);
1573 }
drhc90713d2014-09-30 13:46:49 +00001574}
1575#endif
1576
1577#ifdef WHERETRACE_ENABLED
1578/*
drha18f3d22013-05-08 03:05:41 +00001579** Print a WhereLoop object for debugging purposes
1580*/
drhc1ba2e72013-10-28 19:03:21 +00001581static void whereLoopPrint(WhereLoop *p, WhereClause *pWC){
1582 WhereInfo *pWInfo = pWC->pWInfo;
drh989578e2013-10-28 14:34:35 +00001583 int nb = 1+(pWInfo->pTabList->nSrc+7)/8;
1584 struct SrcList_item *pItem = pWInfo->pTabList->a + p->iTab;
drha18f3d22013-05-08 03:05:41 +00001585 Table *pTab = pItem->pTab;
drh6457a352013-06-21 00:35:37 +00001586 sqlite3DebugPrintf("%c%2d.%0*llx.%0*llx", p->cId,
drha184fb82013-05-08 04:22:59 +00001587 p->iTab, nb, p->maskSelf, nb, p->prereq);
drh6457a352013-06-21 00:35:37 +00001588 sqlite3DebugPrintf(" %12s",
drha18f3d22013-05-08 03:05:41 +00001589 pItem->zAlias ? pItem->zAlias : pTab->zName);
drh5346e952013-05-08 14:14:26 +00001590 if( (p->wsFlags & WHERE_VIRTUALTABLE)==0 ){
drhf3f69ac2014-08-20 23:38:07 +00001591 const char *zName;
1592 if( p->u.btree.pIndex && (zName = p->u.btree.pIndex->zName)!=0 ){
drh319f6772013-05-14 15:31:07 +00001593 if( strncmp(zName, "sqlite_autoindex_", 17)==0 ){
1594 int i = sqlite3Strlen30(zName) - 1;
1595 while( zName[i]!='_' ) i--;
1596 zName += i;
1597 }
drh6457a352013-06-21 00:35:37 +00001598 sqlite3DebugPrintf(".%-16s %2d", zName, p->u.btree.nEq);
drh5346e952013-05-08 14:14:26 +00001599 }else{
drh6457a352013-06-21 00:35:37 +00001600 sqlite3DebugPrintf("%20s","");
drh5346e952013-05-08 14:14:26 +00001601 }
drha18f3d22013-05-08 03:05:41 +00001602 }else{
drh5346e952013-05-08 14:14:26 +00001603 char *z;
1604 if( p->u.vtab.idxStr ){
drh3bd26f02013-05-24 14:52:03 +00001605 z = sqlite3_mprintf("(%d,\"%s\",%x)",
1606 p->u.vtab.idxNum, p->u.vtab.idxStr, p->u.vtab.omitMask);
drh5346e952013-05-08 14:14:26 +00001607 }else{
drh3bd26f02013-05-24 14:52:03 +00001608 z = sqlite3_mprintf("(%d,%x)", p->u.vtab.idxNum, p->u.vtab.omitMask);
drh5346e952013-05-08 14:14:26 +00001609 }
drh6457a352013-06-21 00:35:37 +00001610 sqlite3DebugPrintf(" %-19s", z);
drh5346e952013-05-08 14:14:26 +00001611 sqlite3_free(z);
drha18f3d22013-05-08 03:05:41 +00001612 }
drhf3f69ac2014-08-20 23:38:07 +00001613 if( p->wsFlags & WHERE_SKIPSCAN ){
drhc8bbce12014-10-21 01:05:09 +00001614 sqlite3DebugPrintf(" f %05x %d-%d", p->wsFlags, p->nLTerm,p->nSkip);
drhf3f69ac2014-08-20 23:38:07 +00001615 }else{
1616 sqlite3DebugPrintf(" f %05x N %d", p->wsFlags, p->nLTerm);
1617 }
drhb8a8e8a2013-06-10 19:12:39 +00001618 sqlite3DebugPrintf(" cost %d,%d,%d\n", p->rSetup, p->rRun, p->nOut);
drhc90713d2014-09-30 13:46:49 +00001619 if( p->nLTerm && (sqlite3WhereTrace & 0x100)!=0 ){
1620 int i;
1621 for(i=0; i<p->nLTerm; i++){
drh0a99ba32014-09-30 17:03:35 +00001622 whereTermPrint(p->aLTerm[i], i);
drhc90713d2014-09-30 13:46:49 +00001623 }
1624 }
drha18f3d22013-05-08 03:05:41 +00001625}
1626#endif
1627
drhf1b5f5b2013-05-02 00:15:01 +00001628/*
drh4efc9292013-06-06 23:02:03 +00001629** Convert bulk memory into a valid WhereLoop that can be passed
1630** to whereLoopClear harmlessly.
drh5346e952013-05-08 14:14:26 +00001631*/
drh4efc9292013-06-06 23:02:03 +00001632static void whereLoopInit(WhereLoop *p){
1633 p->aLTerm = p->aLTermSpace;
1634 p->nLTerm = 0;
1635 p->nLSlot = ArraySize(p->aLTermSpace);
1636 p->wsFlags = 0;
1637}
1638
1639/*
1640** Clear the WhereLoop.u union. Leave WhereLoop.pLTerm intact.
1641*/
1642static void whereLoopClearUnion(sqlite3 *db, WhereLoop *p){
drh986b3872013-06-28 21:12:20 +00001643 if( p->wsFlags & (WHERE_VIRTUALTABLE|WHERE_AUTO_INDEX) ){
drh13e11b42013-06-06 23:44:25 +00001644 if( (p->wsFlags & WHERE_VIRTUALTABLE)!=0 && p->u.vtab.needFree ){
1645 sqlite3_free(p->u.vtab.idxStr);
1646 p->u.vtab.needFree = 0;
1647 p->u.vtab.idxStr = 0;
drh986b3872013-06-28 21:12:20 +00001648 }else if( (p->wsFlags & WHERE_AUTO_INDEX)!=0 && p->u.btree.pIndex!=0 ){
drh13e11b42013-06-06 23:44:25 +00001649 sqlite3DbFree(db, p->u.btree.pIndex->zColAff);
1650 sqlite3DbFree(db, p->u.btree.pIndex);
1651 p->u.btree.pIndex = 0;
1652 }
drh5346e952013-05-08 14:14:26 +00001653 }
1654}
1655
drh4efc9292013-06-06 23:02:03 +00001656/*
1657** Deallocate internal memory used by a WhereLoop object
1658*/
1659static void whereLoopClear(sqlite3 *db, WhereLoop *p){
1660 if( p->aLTerm!=p->aLTermSpace ) sqlite3DbFree(db, p->aLTerm);
1661 whereLoopClearUnion(db, p);
1662 whereLoopInit(p);
1663}
1664
1665/*
1666** Increase the memory allocation for pLoop->aLTerm[] to be at least n.
1667*/
1668static int whereLoopResize(sqlite3 *db, WhereLoop *p, int n){
1669 WhereTerm **paNew;
1670 if( p->nLSlot>=n ) return SQLITE_OK;
1671 n = (n+7)&~7;
1672 paNew = sqlite3DbMallocRaw(db, sizeof(p->aLTerm[0])*n);
1673 if( paNew==0 ) return SQLITE_NOMEM;
1674 memcpy(paNew, p->aLTerm, sizeof(p->aLTerm[0])*p->nLSlot);
1675 if( p->aLTerm!=p->aLTermSpace ) sqlite3DbFree(db, p->aLTerm);
1676 p->aLTerm = paNew;
1677 p->nLSlot = n;
1678 return SQLITE_OK;
1679}
1680
1681/*
1682** Transfer content from the second pLoop into the first.
1683*/
1684static int whereLoopXfer(sqlite3 *db, WhereLoop *pTo, WhereLoop *pFrom){
drh4efc9292013-06-06 23:02:03 +00001685 whereLoopClearUnion(db, pTo);
drh0d31dc32013-09-06 00:40:59 +00001686 if( whereLoopResize(db, pTo, pFrom->nLTerm) ){
1687 memset(&pTo->u, 0, sizeof(pTo->u));
1688 return SQLITE_NOMEM;
1689 }
drha2014152013-06-07 00:29:23 +00001690 memcpy(pTo, pFrom, WHERE_LOOP_XFER_SZ);
1691 memcpy(pTo->aLTerm, pFrom->aLTerm, pTo->nLTerm*sizeof(pTo->aLTerm[0]));
drh4efc9292013-06-06 23:02:03 +00001692 if( pFrom->wsFlags & WHERE_VIRTUALTABLE ){
1693 pFrom->u.vtab.needFree = 0;
drh986b3872013-06-28 21:12:20 +00001694 }else if( (pFrom->wsFlags & WHERE_AUTO_INDEX)!=0 ){
drh4efc9292013-06-06 23:02:03 +00001695 pFrom->u.btree.pIndex = 0;
1696 }
1697 return SQLITE_OK;
1698}
1699
drh5346e952013-05-08 14:14:26 +00001700/*
drhf1b5f5b2013-05-02 00:15:01 +00001701** Delete a WhereLoop object
1702*/
1703static void whereLoopDelete(sqlite3 *db, WhereLoop *p){
drh5346e952013-05-08 14:14:26 +00001704 whereLoopClear(db, p);
drhf1b5f5b2013-05-02 00:15:01 +00001705 sqlite3DbFree(db, p);
1706}
drh84bfda42005-07-15 13:05:21 +00001707
drh9eff6162006-06-12 21:59:13 +00001708/*
1709** Free a WhereInfo structure
1710*/
drh10fe8402008-10-11 16:47:35 +00001711static void whereInfoFree(sqlite3 *db, WhereInfo *pWInfo){
drh52ff8ea2010-04-08 14:15:56 +00001712 if( ALWAYS(pWInfo) ){
danf89aa472015-04-25 12:20:24 +00001713 int i;
1714 for(i=0; i<pWInfo->nLevel; i++){
1715 WhereLevel *pLevel = &pWInfo->a[i];
1716 if( pLevel->pWLoop && (pLevel->pWLoop->wsFlags & WHERE_IN_ABLE) ){
1717 sqlite3DbFree(db, pLevel->u.in.aInLoop);
1718 }
1719 }
drh6c1f4ef2015-06-08 14:23:15 +00001720 sqlite3WhereClauseClear(&pWInfo->sWC);
drhf1b5f5b2013-05-02 00:15:01 +00001721 while( pWInfo->pLoops ){
1722 WhereLoop *p = pWInfo->pLoops;
1723 pWInfo->pLoops = p->pNextLoop;
1724 whereLoopDelete(db, p);
1725 }
drh633e6d52008-07-28 19:34:53 +00001726 sqlite3DbFree(db, pWInfo);
drh9eff6162006-06-12 21:59:13 +00001727 }
1728}
1729
drhf1b5f5b2013-05-02 00:15:01 +00001730/*
drhe0de8762014-11-05 13:13:13 +00001731** Return TRUE if all of the following are true:
drhb355c2c2014-04-18 22:20:31 +00001732**
1733** (1) X has the same or lower cost that Y
1734** (2) X is a proper subset of Y
drhe0de8762014-11-05 13:13:13 +00001735** (3) X skips at least as many columns as Y
drhb355c2c2014-04-18 22:20:31 +00001736**
1737** By "proper subset" we mean that X uses fewer WHERE clause terms
1738** than Y and that every WHERE clause term used by X is also used
1739** by Y.
1740**
1741** If X is a proper subset of Y then Y is a better choice and ought
1742** to have a lower cost. This routine returns TRUE when that cost
drhe0de8762014-11-05 13:13:13 +00001743** relationship is inverted and needs to be adjusted. The third rule
1744** was added because if X uses skip-scan less than Y it still might
1745** deserve a lower cost even if it is a proper subset of Y.
drh3fb183d2014-03-31 19:49:00 +00001746*/
drhb355c2c2014-04-18 22:20:31 +00001747static int whereLoopCheaperProperSubset(
1748 const WhereLoop *pX, /* First WhereLoop to compare */
1749 const WhereLoop *pY /* Compare against this WhereLoop */
1750){
drh3fb183d2014-03-31 19:49:00 +00001751 int i, j;
drhc8bbce12014-10-21 01:05:09 +00001752 if( pX->nLTerm-pX->nSkip >= pY->nLTerm-pY->nSkip ){
1753 return 0; /* X is not a subset of Y */
1754 }
drhe0de8762014-11-05 13:13:13 +00001755 if( pY->nSkip > pX->nSkip ) return 0;
drhb355c2c2014-04-18 22:20:31 +00001756 if( pX->rRun >= pY->rRun ){
1757 if( pX->rRun > pY->rRun ) return 0; /* X costs more than Y */
1758 if( pX->nOut > pY->nOut ) return 0; /* X costs more than Y */
drh3fb183d2014-03-31 19:49:00 +00001759 }
drh9ee88102014-05-07 20:33:17 +00001760 for(i=pX->nLTerm-1; i>=0; i--){
drhc8bbce12014-10-21 01:05:09 +00001761 if( pX->aLTerm[i]==0 ) continue;
drhb355c2c2014-04-18 22:20:31 +00001762 for(j=pY->nLTerm-1; j>=0; j--){
1763 if( pY->aLTerm[j]==pX->aLTerm[i] ) break;
1764 }
1765 if( j<0 ) return 0; /* X not a subset of Y since term X[i] not used by Y */
1766 }
1767 return 1; /* All conditions meet */
drh3fb183d2014-03-31 19:49:00 +00001768}
1769
1770/*
1771** Try to adjust the cost of WhereLoop pTemplate upwards or downwards so
1772** that:
drh53cd10a2014-03-31 18:24:18 +00001773**
drh3fb183d2014-03-31 19:49:00 +00001774** (1) pTemplate costs less than any other WhereLoops that are a proper
1775** subset of pTemplate
drh53cd10a2014-03-31 18:24:18 +00001776**
drh3fb183d2014-03-31 19:49:00 +00001777** (2) pTemplate costs more than any other WhereLoops for which pTemplate
1778** is a proper subset.
drh53cd10a2014-03-31 18:24:18 +00001779**
drh3fb183d2014-03-31 19:49:00 +00001780** To say "WhereLoop X is a proper subset of Y" means that X uses fewer
1781** WHERE clause terms than Y and that every WHERE clause term used by X is
1782** also used by Y.
drh53cd10a2014-03-31 18:24:18 +00001783*/
1784static void whereLoopAdjustCost(const WhereLoop *p, WhereLoop *pTemplate){
1785 if( (pTemplate->wsFlags & WHERE_INDEXED)==0 ) return;
drh53cd10a2014-03-31 18:24:18 +00001786 for(; p; p=p->pNextLoop){
drh3fb183d2014-03-31 19:49:00 +00001787 if( p->iTab!=pTemplate->iTab ) continue;
1788 if( (p->wsFlags & WHERE_INDEXED)==0 ) continue;
drhb355c2c2014-04-18 22:20:31 +00001789 if( whereLoopCheaperProperSubset(p, pTemplate) ){
1790 /* Adjust pTemplate cost downward so that it is cheaper than its
drhe0de8762014-11-05 13:13:13 +00001791 ** subset p. */
drh1b131b72014-10-21 16:01:40 +00001792 WHERETRACE(0x80,("subset cost adjustment %d,%d to %d,%d\n",
1793 pTemplate->rRun, pTemplate->nOut, p->rRun, p->nOut-1));
drh3fb183d2014-03-31 19:49:00 +00001794 pTemplate->rRun = p->rRun;
1795 pTemplate->nOut = p->nOut - 1;
drhb355c2c2014-04-18 22:20:31 +00001796 }else if( whereLoopCheaperProperSubset(pTemplate, p) ){
1797 /* Adjust pTemplate cost upward so that it is costlier than p since
1798 ** pTemplate is a proper subset of p */
drh1b131b72014-10-21 16:01:40 +00001799 WHERETRACE(0x80,("subset cost adjustment %d,%d to %d,%d\n",
1800 pTemplate->rRun, pTemplate->nOut, p->rRun, p->nOut+1));
drh3fb183d2014-03-31 19:49:00 +00001801 pTemplate->rRun = p->rRun;
1802 pTemplate->nOut = p->nOut + 1;
drh53cd10a2014-03-31 18:24:18 +00001803 }
1804 }
1805}
1806
1807/*
drh7a4b1642014-03-29 21:16:07 +00001808** Search the list of WhereLoops in *ppPrev looking for one that can be
1809** supplanted by pTemplate.
drhf1b5f5b2013-05-02 00:15:01 +00001810**
drh7a4b1642014-03-29 21:16:07 +00001811** Return NULL if the WhereLoop list contains an entry that can supplant
1812** pTemplate, in other words if pTemplate does not belong on the list.
drh23f98da2013-05-21 15:52:07 +00001813**
drh7a4b1642014-03-29 21:16:07 +00001814** If pX is a WhereLoop that pTemplate can supplant, then return the
1815** link that points to pX.
drh23f98da2013-05-21 15:52:07 +00001816**
drh7a4b1642014-03-29 21:16:07 +00001817** If pTemplate cannot supplant any existing element of the list but needs
1818** to be added to the list, then return a pointer to the tail of the list.
drhf1b5f5b2013-05-02 00:15:01 +00001819*/
drh7a4b1642014-03-29 21:16:07 +00001820static WhereLoop **whereLoopFindLesser(
1821 WhereLoop **ppPrev,
1822 const WhereLoop *pTemplate
1823){
1824 WhereLoop *p;
1825 for(p=(*ppPrev); p; ppPrev=&p->pNextLoop, p=*ppPrev){
drhdbb80232013-06-19 12:34:13 +00001826 if( p->iTab!=pTemplate->iTab || p->iSortIdx!=pTemplate->iSortIdx ){
1827 /* If either the iTab or iSortIdx values for two WhereLoop are different
1828 ** then those WhereLoops need to be considered separately. Neither is
1829 ** a candidate to replace the other. */
1830 continue;
1831 }
1832 /* In the current implementation, the rSetup value is either zero
1833 ** or the cost of building an automatic index (NlogN) and the NlogN
1834 ** is the same for compatible WhereLoops. */
1835 assert( p->rSetup==0 || pTemplate->rSetup==0
1836 || p->rSetup==pTemplate->rSetup );
1837
1838 /* whereLoopAddBtree() always generates and inserts the automatic index
1839 ** case first. Hence compatible candidate WhereLoops never have a larger
1840 ** rSetup. Call this SETUP-INVARIANT */
1841 assert( p->rSetup>=pTemplate->rSetup );
1842
drhdabe36d2014-06-17 20:16:43 +00001843 /* Any loop using an appliation-defined index (or PRIMARY KEY or
1844 ** UNIQUE constraint) with one or more == constraints is better
dan70273d02014-11-14 19:34:20 +00001845 ** than an automatic index. Unless it is a skip-scan. */
drhdabe36d2014-06-17 20:16:43 +00001846 if( (p->wsFlags & WHERE_AUTO_INDEX)!=0
dan70273d02014-11-14 19:34:20 +00001847 && (pTemplate->nSkip)==0
drhdabe36d2014-06-17 20:16:43 +00001848 && (pTemplate->wsFlags & WHERE_INDEXED)!=0
1849 && (pTemplate->wsFlags & WHERE_COLUMN_EQ)!=0
1850 && (p->prereq & pTemplate->prereq)==pTemplate->prereq
1851 ){
1852 break;
1853 }
1854
drh53cd10a2014-03-31 18:24:18 +00001855 /* If existing WhereLoop p is better than pTemplate, pTemplate can be
1856 ** discarded. WhereLoop p is better if:
1857 ** (1) p has no more dependencies than pTemplate, and
1858 ** (2) p has an equal or lower cost than pTemplate
1859 */
1860 if( (p->prereq & pTemplate->prereq)==p->prereq /* (1) */
1861 && p->rSetup<=pTemplate->rSetup /* (2a) */
1862 && p->rRun<=pTemplate->rRun /* (2b) */
1863 && p->nOut<=pTemplate->nOut /* (2c) */
drhf1b5f5b2013-05-02 00:15:01 +00001864 ){
drh53cd10a2014-03-31 18:24:18 +00001865 return 0; /* Discard pTemplate */
drhf1b5f5b2013-05-02 00:15:01 +00001866 }
drh53cd10a2014-03-31 18:24:18 +00001867
1868 /* If pTemplate is always better than p, then cause p to be overwritten
1869 ** with pTemplate. pTemplate is better than p if:
1870 ** (1) pTemplate has no more dependences than p, and
1871 ** (2) pTemplate has an equal or lower cost than p.
1872 */
1873 if( (p->prereq & pTemplate->prereq)==pTemplate->prereq /* (1) */
1874 && p->rRun>=pTemplate->rRun /* (2a) */
1875 && p->nOut>=pTemplate->nOut /* (2b) */
drhf1b5f5b2013-05-02 00:15:01 +00001876 ){
drhadd5ce32013-09-07 00:29:06 +00001877 assert( p->rSetup>=pTemplate->rSetup ); /* SETUP-INVARIANT above */
drh53cd10a2014-03-31 18:24:18 +00001878 break; /* Cause p to be overwritten by pTemplate */
drhf1b5f5b2013-05-02 00:15:01 +00001879 }
1880 }
drh7a4b1642014-03-29 21:16:07 +00001881 return ppPrev;
1882}
1883
1884/*
drh94a11212004-09-25 13:12:14 +00001885** Insert or replace a WhereLoop entry using the template supplied.
1886**
1887** An existing WhereLoop entry might be overwritten if the new template
1888** is better and has fewer dependencies. Or the template will be ignored
1889** and no insert will occur if an existing WhereLoop is faster and has
1890** fewer dependencies than the template. Otherwise a new WhereLoop is
danielk1977b3bce662005-01-29 08:32:43 +00001891** added based on the template.
drh94a11212004-09-25 13:12:14 +00001892**
drh7a4b1642014-03-29 21:16:07 +00001893** If pBuilder->pOrSet is not NULL then we care about only the
drh94a11212004-09-25 13:12:14 +00001894** prerequisites and rRun and nOut costs of the N best loops. That
1895** information is gathered in the pBuilder->pOrSet object. This special
1896** processing mode is used only for OR clause processing.
danielk1977b3bce662005-01-29 08:32:43 +00001897**
drh94a11212004-09-25 13:12:14 +00001898** When accumulating multiple loops (when pBuilder->pOrSet is NULL) we
danielk1977b3bce662005-01-29 08:32:43 +00001899** still might overwrite similar loops with the new template if the
drh53cd10a2014-03-31 18:24:18 +00001900** new template is better. Loops may be overwritten if the following
drh94a11212004-09-25 13:12:14 +00001901** conditions are met:
1902**
1903** (1) They have the same iTab.
1904** (2) They have the same iSortIdx.
1905** (3) The template has same or fewer dependencies than the current loop
1906** (4) The template has the same or lower cost than the current loop
drh94a11212004-09-25 13:12:14 +00001907*/
1908static int whereLoopInsert(WhereLoopBuilder *pBuilder, WhereLoop *pTemplate){
drh7a4b1642014-03-29 21:16:07 +00001909 WhereLoop **ppPrev, *p;
drh94a11212004-09-25 13:12:14 +00001910 WhereInfo *pWInfo = pBuilder->pWInfo;
1911 sqlite3 *db = pWInfo->pParse->db;
1912
1913 /* If pBuilder->pOrSet is defined, then only keep track of the costs
1914 ** and prereqs.
1915 */
1916 if( pBuilder->pOrSet!=0 ){
1917#if WHERETRACE_ENABLED
1918 u16 n = pBuilder->pOrSet->n;
1919 int x =
1920#endif
danielk1977b3bce662005-01-29 08:32:43 +00001921 whereOrInsert(pBuilder->pOrSet, pTemplate->prereq, pTemplate->rRun,
1922 pTemplate->nOut);
1923#if WHERETRACE_ENABLED /* 0x8 */
drh94a11212004-09-25 13:12:14 +00001924 if( sqlite3WhereTrace & 0x8 ){
danielk1977b3bce662005-01-29 08:32:43 +00001925 sqlite3DebugPrintf(x?" or-%d: ":" or-X: ", n);
drh9012bcb2004-12-19 00:11:35 +00001926 whereLoopPrint(pTemplate, pBuilder->pWC);
drh94a11212004-09-25 13:12:14 +00001927 }
1928#endif
danielk1977b3bce662005-01-29 08:32:43 +00001929 return SQLITE_OK;
drh94a11212004-09-25 13:12:14 +00001930 }
1931
drh7a4b1642014-03-29 21:16:07 +00001932 /* Look for an existing WhereLoop to replace with pTemplate
drh51669862004-12-18 18:40:26 +00001933 */
drh53cd10a2014-03-31 18:24:18 +00001934 whereLoopAdjustCost(pWInfo->pLoops, pTemplate);
drh7a4b1642014-03-29 21:16:07 +00001935 ppPrev = whereLoopFindLesser(&pWInfo->pLoops, pTemplate);
drhf1b5f5b2013-05-02 00:15:01 +00001936
drh7a4b1642014-03-29 21:16:07 +00001937 if( ppPrev==0 ){
1938 /* There already exists a WhereLoop on the list that is better
1939 ** than pTemplate, so just ignore pTemplate */
1940#if WHERETRACE_ENABLED /* 0x8 */
1941 if( sqlite3WhereTrace & 0x8 ){
drh9a7b41d2014-10-08 00:08:08 +00001942 sqlite3DebugPrintf(" skip: ");
drh7a4b1642014-03-29 21:16:07 +00001943 whereLoopPrint(pTemplate, pBuilder->pWC);
drhf1b5f5b2013-05-02 00:15:01 +00001944 }
drh7a4b1642014-03-29 21:16:07 +00001945#endif
1946 return SQLITE_OK;
1947 }else{
1948 p = *ppPrev;
drhf1b5f5b2013-05-02 00:15:01 +00001949 }
1950
1951 /* If we reach this point it means that either p[] should be overwritten
1952 ** with pTemplate[] if p[] exists, or if p==NULL then allocate a new
1953 ** WhereLoop and insert it.
1954 */
drh989578e2013-10-28 14:34:35 +00001955#if WHERETRACE_ENABLED /* 0x8 */
drhae70cf12013-05-31 15:18:46 +00001956 if( sqlite3WhereTrace & 0x8 ){
1957 if( p!=0 ){
drh9a7b41d2014-10-08 00:08:08 +00001958 sqlite3DebugPrintf("replace: ");
drhc1ba2e72013-10-28 19:03:21 +00001959 whereLoopPrint(p, pBuilder->pWC);
drhae70cf12013-05-31 15:18:46 +00001960 }
drh9a7b41d2014-10-08 00:08:08 +00001961 sqlite3DebugPrintf(" add: ");
drhc1ba2e72013-10-28 19:03:21 +00001962 whereLoopPrint(pTemplate, pBuilder->pWC);
drhae70cf12013-05-31 15:18:46 +00001963 }
1964#endif
drhf1b5f5b2013-05-02 00:15:01 +00001965 if( p==0 ){
drh7a4b1642014-03-29 21:16:07 +00001966 /* Allocate a new WhereLoop to add to the end of the list */
1967 *ppPrev = p = sqlite3DbMallocRaw(db, sizeof(WhereLoop));
drhf1b5f5b2013-05-02 00:15:01 +00001968 if( p==0 ) return SQLITE_NOMEM;
drh4efc9292013-06-06 23:02:03 +00001969 whereLoopInit(p);
drh7a4b1642014-03-29 21:16:07 +00001970 p->pNextLoop = 0;
1971 }else{
1972 /* We will be overwriting WhereLoop p[]. But before we do, first
1973 ** go through the rest of the list and delete any other entries besides
1974 ** p[] that are also supplated by pTemplate */
1975 WhereLoop **ppTail = &p->pNextLoop;
1976 WhereLoop *pToDel;
1977 while( *ppTail ){
1978 ppTail = whereLoopFindLesser(ppTail, pTemplate);
drhdabe36d2014-06-17 20:16:43 +00001979 if( ppTail==0 ) break;
drh7a4b1642014-03-29 21:16:07 +00001980 pToDel = *ppTail;
1981 if( pToDel==0 ) break;
1982 *ppTail = pToDel->pNextLoop;
1983#if WHERETRACE_ENABLED /* 0x8 */
1984 if( sqlite3WhereTrace & 0x8 ){
drh9a7b41d2014-10-08 00:08:08 +00001985 sqlite3DebugPrintf(" delete: ");
drh7a4b1642014-03-29 21:16:07 +00001986 whereLoopPrint(pToDel, pBuilder->pWC);
1987 }
1988#endif
1989 whereLoopDelete(db, pToDel);
1990 }
drhf1b5f5b2013-05-02 00:15:01 +00001991 }
drh4efc9292013-06-06 23:02:03 +00001992 whereLoopXfer(db, p, pTemplate);
drh5346e952013-05-08 14:14:26 +00001993 if( (p->wsFlags & WHERE_VIRTUALTABLE)==0 ){
drhef866372013-05-22 20:49:02 +00001994 Index *pIndex = p->u.btree.pIndex;
1995 if( pIndex && pIndex->tnum==0 ){
drhcf8fa7a2013-05-10 20:26:22 +00001996 p->u.btree.pIndex = 0;
1997 }
drh5346e952013-05-08 14:14:26 +00001998 }
drhf1b5f5b2013-05-02 00:15:01 +00001999 return SQLITE_OK;
2000}
2001
2002/*
drhcca9f3d2013-09-06 15:23:29 +00002003** Adjust the WhereLoop.nOut value downward to account for terms of the
2004** WHERE clause that reference the loop but which are not used by an
2005** index.
drh7a1bca72014-11-22 18:50:44 +00002006*
2007** For every WHERE clause term that is not used by the index
2008** and which has a truth probability assigned by one of the likelihood(),
2009** likely(), or unlikely() SQL functions, reduce the estimated number
2010** of output rows by the probability specified.
drhcca9f3d2013-09-06 15:23:29 +00002011**
drh7a1bca72014-11-22 18:50:44 +00002012** TUNING: For every WHERE clause term that is not used by the index
2013** and which does not have an assigned truth probability, heuristics
2014** described below are used to try to estimate the truth probability.
2015** TODO --> Perhaps this is something that could be improved by better
2016** table statistics.
2017**
drhab4624d2014-11-22 19:52:10 +00002018** Heuristic 1: Estimate the truth probability as 93.75%. The 93.75%
2019** value corresponds to -1 in LogEst notation, so this means decrement
drh7a1bca72014-11-22 18:50:44 +00002020** the WhereLoop.nOut field for every such WHERE clause term.
2021**
2022** Heuristic 2: If there exists one or more WHERE clause terms of the
2023** form "x==EXPR" and EXPR is not a constant 0 or 1, then make sure the
2024** final output row estimate is no greater than 1/4 of the total number
2025** of rows in the table. In other words, assume that x==EXPR will filter
2026** out at least 3 out of 4 rows. If EXPR is -1 or 0 or 1, then maybe the
2027** "x" column is boolean or else -1 or 0 or 1 is a common default value
2028** on the "x" column and so in that case only cap the output row estimate
2029** at 1/2 instead of 1/4.
drhcca9f3d2013-09-06 15:23:29 +00002030*/
drhd8b77e22014-09-06 01:35:57 +00002031static void whereLoopOutputAdjust(
2032 WhereClause *pWC, /* The WHERE clause */
2033 WhereLoop *pLoop, /* The loop to adjust downward */
2034 LogEst nRow /* Number of rows in the entire table */
2035){
drh7d9e7d82013-09-11 17:39:09 +00002036 WhereTerm *pTerm, *pX;
drhcca9f3d2013-09-06 15:23:29 +00002037 Bitmask notAllowed = ~(pLoop->prereq|pLoop->maskSelf);
drh7a1bca72014-11-22 18:50:44 +00002038 int i, j, k;
2039 LogEst iReduce = 0; /* pLoop->nOut should not exceed nRow-iReduce */
drhadd5ce32013-09-07 00:29:06 +00002040
drha3898252014-11-22 12:22:13 +00002041 assert( (pLoop->wsFlags & WHERE_AUTO_INDEX)==0 );
drhcca9f3d2013-09-06 15:23:29 +00002042 for(i=pWC->nTerm, pTerm=pWC->a; i>0; i--, pTerm++){
drh7d9e7d82013-09-11 17:39:09 +00002043 if( (pTerm->wtFlags & TERM_VIRTUAL)!=0 ) break;
drhcca9f3d2013-09-06 15:23:29 +00002044 if( (pTerm->prereqAll & pLoop->maskSelf)==0 ) continue;
2045 if( (pTerm->prereqAll & notAllowed)!=0 ) continue;
drh7d9e7d82013-09-11 17:39:09 +00002046 for(j=pLoop->nLTerm-1; j>=0; j--){
2047 pX = pLoop->aLTerm[j];
drhd2447442013-11-13 19:01:41 +00002048 if( pX==0 ) continue;
drh7d9e7d82013-09-11 17:39:09 +00002049 if( pX==pTerm ) break;
2050 if( pX->iParent>=0 && (&pWC->a[pX->iParent])==pTerm ) break;
2051 }
danaa9933c2014-04-24 20:04:49 +00002052 if( j<0 ){
drhd8b77e22014-09-06 01:35:57 +00002053 if( pTerm->truthProb<=0 ){
drh7a1bca72014-11-22 18:50:44 +00002054 /* If a truth probability is specified using the likelihood() hints,
2055 ** then use the probability provided by the application. */
drhd8b77e22014-09-06 01:35:57 +00002056 pLoop->nOut += pTerm->truthProb;
2057 }else{
drh7a1bca72014-11-22 18:50:44 +00002058 /* In the absence of explicit truth probabilities, use heuristics to
2059 ** guess a reasonable truth probability. */
drhd8b77e22014-09-06 01:35:57 +00002060 pLoop->nOut--;
drhe8d0c612015-05-14 01:05:25 +00002061 if( pTerm->eOperator&(WO_EQ|WO_IS) ){
drh7a1bca72014-11-22 18:50:44 +00002062 Expr *pRight = pTerm->pExpr->pRight;
drhe0cc3c22015-05-13 17:54:08 +00002063 testcase( pTerm->pExpr->op==TK_IS );
drh7a1bca72014-11-22 18:50:44 +00002064 if( sqlite3ExprIsInteger(pRight, &k) && k>=(-1) && k<=1 ){
2065 k = 10;
2066 }else{
2067 k = 20;
2068 }
2069 if( iReduce<k ) iReduce = k;
2070 }
drhd8b77e22014-09-06 01:35:57 +00002071 }
danaa9933c2014-04-24 20:04:49 +00002072 }
drhcca9f3d2013-09-06 15:23:29 +00002073 }
drh7a1bca72014-11-22 18:50:44 +00002074 if( pLoop->nOut > nRow-iReduce ) pLoop->nOut = nRow - iReduce;
drhcca9f3d2013-09-06 15:23:29 +00002075}
2076
/*
** Adjust the cost C by the costMult factor T.  The adjustment is made by
** adding T to C.  This only occurs if compiled with
** -DSQLITE_ENABLE_COSTMULT; otherwise the macro expands to nothing and
** neither argument is evaluated.
*/
#ifdef SQLITE_ENABLE_COSTMULT
# define ApplyCostMultiplier(C,T)  (C) += (T)
#else
# define ApplyCostMultiplier(C,T)
#endif
2086
2087/*
dan4a6b8a02014-04-30 14:47:01 +00002088** We have so far matched pBuilder->pNew->u.btree.nEq terms of the
2089** index pIndex. Try to match one more.
2090**
2091** When this function is called, pBuilder->pNew->nOut contains the
2092** number of rows expected to be visited by filtering using the nEq
2093** terms only. If it is modified, this value is restored before this
2094** function returns.
drh1c8148f2013-05-04 20:25:23 +00002095**
2096** If pProbe->tnum==0, that means pIndex is a fake index used for the
2097** INTEGER PRIMARY KEY.
2098*/
drh5346e952013-05-08 14:14:26 +00002099static int whereLoopAddBtreeIndex(
drh1c8148f2013-05-04 20:25:23 +00002100 WhereLoopBuilder *pBuilder, /* The WhereLoop factory */
2101 struct SrcList_item *pSrc, /* FROM clause term being analyzed */
2102 Index *pProbe, /* An index on pSrc */
drhbf539c42013-10-05 18:16:02 +00002103 LogEst nInMul /* log(Number of iterations due to IN) */
drh1c8148f2013-05-04 20:25:23 +00002104){
drh70d18342013-06-06 19:16:33 +00002105 WhereInfo *pWInfo = pBuilder->pWInfo; /* WHERE analyse context */
2106 Parse *pParse = pWInfo->pParse; /* Parsing context */
2107 sqlite3 *db = pParse->db; /* Database connection malloc context */
drh1c8148f2013-05-04 20:25:23 +00002108 WhereLoop *pNew; /* Template WhereLoop under construction */
2109 WhereTerm *pTerm; /* A WhereTerm under consideration */
drh43fe25f2013-05-07 23:06:23 +00002110 int opMask; /* Valid operators for constraints */
drh1c8148f2013-05-04 20:25:23 +00002111 WhereScan scan; /* Iterator for WHERE terms */
drh4efc9292013-06-06 23:02:03 +00002112 Bitmask saved_prereq; /* Original value of pNew->prereq */
2113 u16 saved_nLTerm; /* Original value of pNew->nLTerm */
drhcd8629e2013-11-13 12:27:25 +00002114 u16 saved_nEq; /* Original value of pNew->u.btree.nEq */
drhc8bbce12014-10-21 01:05:09 +00002115 u16 saved_nSkip; /* Original value of pNew->nSkip */
drh4efc9292013-06-06 23:02:03 +00002116 u32 saved_wsFlags; /* Original value of pNew->wsFlags */
drhbf539c42013-10-05 18:16:02 +00002117 LogEst saved_nOut; /* Original value of pNew->nOut */
drha18f3d22013-05-08 03:05:41 +00002118 int iCol; /* Index of the column in the table */
drh5346e952013-05-08 14:14:26 +00002119 int rc = SQLITE_OK; /* Return code */
drhd8b77e22014-09-06 01:35:57 +00002120 LogEst rSize; /* Number of rows in the table */
drhbf539c42013-10-05 18:16:02 +00002121 LogEst rLogSize; /* Logarithm of table size */
drhc7f0d222013-06-19 03:27:12 +00002122 WhereTerm *pTop = 0, *pBtm = 0; /* Top and bottom range constraints */
drh1c8148f2013-05-04 20:25:23 +00002123
drh1c8148f2013-05-04 20:25:23 +00002124 pNew = pBuilder->pNew;
drh5346e952013-05-08 14:14:26 +00002125 if( db->mallocFailed ) return SQLITE_NOMEM;
drh1c8148f2013-05-04 20:25:23 +00002126
drh5346e952013-05-08 14:14:26 +00002127 assert( (pNew->wsFlags & WHERE_VIRTUALTABLE)==0 );
drh43fe25f2013-05-07 23:06:23 +00002128 assert( (pNew->wsFlags & WHERE_TOP_LIMIT)==0 );
2129 if( pNew->wsFlags & WHERE_BTM_LIMIT ){
2130 opMask = WO_LT|WO_LE;
drh8a48b9c2015-08-19 15:20:00 +00002131 }else if( /*pProbe->tnum<=0 ||*/ (pSrc->fg.jointype & JT_LEFT)!=0 ){
drh43fe25f2013-05-07 23:06:23 +00002132 opMask = WO_EQ|WO_IN|WO_GT|WO_GE|WO_LT|WO_LE;
drh1c8148f2013-05-04 20:25:23 +00002133 }else{
drhe8d0c612015-05-14 01:05:25 +00002134 opMask = WO_EQ|WO_IN|WO_GT|WO_GE|WO_LT|WO_LE|WO_ISNULL|WO_IS;
drh1c8148f2013-05-04 20:25:23 +00002135 }
drhef866372013-05-22 20:49:02 +00002136 if( pProbe->bUnordered ) opMask &= ~(WO_GT|WO_GE|WO_LT|WO_LE);
drh1c8148f2013-05-04 20:25:23 +00002137
dan39129ce2014-06-30 15:23:57 +00002138 assert( pNew->u.btree.nEq<pProbe->nColumn );
2139 iCol = pProbe->aiColumn[pNew->u.btree.nEq];
2140
drha18f3d22013-05-08 03:05:41 +00002141 pTerm = whereScanInit(&scan, pBuilder->pWC, pSrc->iCursor, iCol,
drh0f133a42013-05-22 17:01:17 +00002142 opMask, pProbe);
drh4efc9292013-06-06 23:02:03 +00002143 saved_nEq = pNew->u.btree.nEq;
drhc8bbce12014-10-21 01:05:09 +00002144 saved_nSkip = pNew->nSkip;
drh4efc9292013-06-06 23:02:03 +00002145 saved_nLTerm = pNew->nLTerm;
2146 saved_wsFlags = pNew->wsFlags;
2147 saved_prereq = pNew->prereq;
2148 saved_nOut = pNew->nOut;
drhb8a8e8a2013-06-10 19:12:39 +00002149 pNew->rSetup = 0;
drhd8b77e22014-09-06 01:35:57 +00002150 rSize = pProbe->aiRowLogEst[0];
2151 rLogSize = estLog(rSize);
drh5346e952013-05-08 14:14:26 +00002152 for(; rc==SQLITE_OK && pTerm!=0; pTerm = whereScanNext(&scan)){
dan8ad1d8b2014-04-25 20:22:45 +00002153 u16 eOp = pTerm->eOperator; /* Shorthand for pTerm->eOperator */
danaa9933c2014-04-24 20:04:49 +00002154 LogEst rCostIdx;
dan8ad1d8b2014-04-25 20:22:45 +00002155 LogEst nOutUnadjusted; /* nOut before IN() and WHERE adjustments */
drhb8a8e8a2013-06-10 19:12:39 +00002156 int nIn = 0;
drh1435a9a2013-08-27 23:15:44 +00002157#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
dan7a419232013-08-06 20:01:43 +00002158 int nRecValid = pBuilder->nRecValid;
drhb5246e52013-07-08 21:12:57 +00002159#endif
dan8ad1d8b2014-04-25 20:22:45 +00002160 if( (eOp==WO_ISNULL || (pTerm->wtFlags&TERM_VNULL)!=0)
dan8bff07a2013-08-29 14:56:14 +00002161 && (iCol<0 || pSrc->pTab->aCol[iCol].notNull)
2162 ){
2163 continue; /* ignore IS [NOT] NULL constraints on NOT NULL columns */
2164 }
dan7a419232013-08-06 20:01:43 +00002165 if( pTerm->prereqRight & pNew->maskSelf ) continue;
2166
drha40da622015-03-09 12:11:56 +00002167 /* Do not allow the upper bound of a LIKE optimization range constraint
2168 ** to mix with a lower range bound from some other source */
2169 if( pTerm->wtFlags & TERM_LIKEOPT && pTerm->eOperator==WO_LT ) continue;
2170
drh4efc9292013-06-06 23:02:03 +00002171 pNew->wsFlags = saved_wsFlags;
2172 pNew->u.btree.nEq = saved_nEq;
2173 pNew->nLTerm = saved_nLTerm;
2174 if( whereLoopResize(db, pNew, pNew->nLTerm+1) ) break; /* OOM */
2175 pNew->aLTerm[pNew->nLTerm++] = pTerm;
2176 pNew->prereq = (saved_prereq | pTerm->prereqRight) & ~pNew->maskSelf;
dan8ad1d8b2014-04-25 20:22:45 +00002177
2178 assert( nInMul==0
2179 || (pNew->wsFlags & WHERE_COLUMN_NULL)!=0
2180 || (pNew->wsFlags & WHERE_COLUMN_IN)!=0
2181 || (pNew->wsFlags & WHERE_SKIPSCAN)!=0
2182 );
2183
2184 if( eOp & WO_IN ){
drha18f3d22013-05-08 03:05:41 +00002185 Expr *pExpr = pTerm->pExpr;
2186 pNew->wsFlags |= WHERE_COLUMN_IN;
2187 if( ExprHasProperty(pExpr, EP_xIsSelect) ){
drhe1e2e9a2013-06-13 15:16:53 +00002188 /* "x IN (SELECT ...)": TUNING: the SELECT returns 25 rows */
drhbf539c42013-10-05 18:16:02 +00002189 nIn = 46; assert( 46==sqlite3LogEst(25) );
drha18f3d22013-05-08 03:05:41 +00002190 }else if( ALWAYS(pExpr->x.pList && pExpr->x.pList->nExpr) ){
2191 /* "x IN (value, value, ...)" */
drhbf539c42013-10-05 18:16:02 +00002192 nIn = sqlite3LogEst(pExpr->x.pList->nExpr);
drhf1645f02013-05-07 19:44:38 +00002193 }
drh2b59b3a2014-03-20 13:26:47 +00002194 assert( nIn>0 ); /* RHS always has 2 or more terms... The parser
2195 ** changes "x IN (?)" into "x=?". */
dan8ad1d8b2014-04-25 20:22:45 +00002196
drhe8d0c612015-05-14 01:05:25 +00002197 }else if( eOp & (WO_EQ|WO_IS) ){
drha18f3d22013-05-08 03:05:41 +00002198 pNew->wsFlags |= WHERE_COLUMN_EQ;
dan8ad1d8b2014-04-25 20:22:45 +00002199 if( iCol<0 || (nInMul==0 && pNew->u.btree.nEq==pProbe->nKeyCol-1) ){
dan2813bde2015-04-11 11:44:27 +00002200 if( iCol>=0 && pProbe->uniqNotNull==0 ){
drhe39a7322014-02-03 14:04:11 +00002201 pNew->wsFlags |= WHERE_UNQ_WANTED;
2202 }else{
2203 pNew->wsFlags |= WHERE_ONEROW;
2204 }
drh21f7ff72013-06-03 15:07:23 +00002205 }
dan2dd3cdc2014-04-26 20:21:14 +00002206 }else if( eOp & WO_ISNULL ){
2207 pNew->wsFlags |= WHERE_COLUMN_NULL;
dan8ad1d8b2014-04-25 20:22:45 +00002208 }else if( eOp & (WO_GT|WO_GE) ){
2209 testcase( eOp & WO_GT );
2210 testcase( eOp & WO_GE );
drha18f3d22013-05-08 03:05:41 +00002211 pNew->wsFlags |= WHERE_COLUMN_RANGE|WHERE_BTM_LIMIT;
drh6f2bfad2013-06-03 17:35:22 +00002212 pBtm = pTerm;
2213 pTop = 0;
drha40da622015-03-09 12:11:56 +00002214 if( pTerm->wtFlags & TERM_LIKEOPT ){
drh80314622015-03-09 13:01:02 +00002215 /* Range contraints that come from the LIKE optimization are
2216 ** always used in pairs. */
drha40da622015-03-09 12:11:56 +00002217 pTop = &pTerm[1];
2218 assert( (pTop-(pTerm->pWC->a))<pTerm->pWC->nTerm );
2219 assert( pTop->wtFlags & TERM_LIKEOPT );
2220 assert( pTop->eOperator==WO_LT );
2221 if( whereLoopResize(db, pNew, pNew->nLTerm+1) ) break; /* OOM */
2222 pNew->aLTerm[pNew->nLTerm++] = pTop;
2223 pNew->wsFlags |= WHERE_TOP_LIMIT;
2224 }
dan2dd3cdc2014-04-26 20:21:14 +00002225 }else{
dan8ad1d8b2014-04-25 20:22:45 +00002226 assert( eOp & (WO_LT|WO_LE) );
2227 testcase( eOp & WO_LT );
2228 testcase( eOp & WO_LE );
drha18f3d22013-05-08 03:05:41 +00002229 pNew->wsFlags |= WHERE_COLUMN_RANGE|WHERE_TOP_LIMIT;
drh6f2bfad2013-06-03 17:35:22 +00002230 pTop = pTerm;
2231 pBtm = (pNew->wsFlags & WHERE_BTM_LIMIT)!=0 ?
drh4efc9292013-06-06 23:02:03 +00002232 pNew->aLTerm[pNew->nLTerm-2] : 0;
drh1c8148f2013-05-04 20:25:23 +00002233 }
dan8ad1d8b2014-04-25 20:22:45 +00002234
2235 /* At this point pNew->nOut is set to the number of rows expected to
2236 ** be visited by the index scan before considering term pTerm, or the
2237 ** values of nIn and nInMul. In other words, assuming that all
2238 ** "x IN(...)" terms are replaced with "x = ?". This block updates
2239 ** the value of pNew->nOut to account for pTerm (but not nIn/nInMul). */
2240 assert( pNew->nOut==saved_nOut );
drh6f2bfad2013-06-03 17:35:22 +00002241 if( pNew->wsFlags & WHERE_COLUMN_RANGE ){
danaa9933c2014-04-24 20:04:49 +00002242 /* Adjust nOut using stat3/stat4 data. Or, if there is no stat3/stat4
2243 ** data, using some other estimate. */
drh186ad8c2013-10-08 18:40:37 +00002244 whereRangeScanEst(pParse, pBuilder, pBtm, pTop, pNew);
dan8ad1d8b2014-04-25 20:22:45 +00002245 }else{
2246 int nEq = ++pNew->u.btree.nEq;
drhe8d0c612015-05-14 01:05:25 +00002247 assert( eOp & (WO_ISNULL|WO_EQ|WO_IN|WO_IS) );
dan8ad1d8b2014-04-25 20:22:45 +00002248
2249 assert( pNew->nOut==saved_nOut );
dan09e1df62014-04-29 16:10:22 +00002250 if( pTerm->truthProb<=0 && iCol>=0 ){
dan8ad1d8b2014-04-25 20:22:45 +00002251 assert( (eOp & WO_IN) || nIn==0 );
drhc5f246e2014-05-01 20:24:21 +00002252 testcase( eOp & WO_IN );
dan8ad1d8b2014-04-25 20:22:45 +00002253 pNew->nOut += pTerm->truthProb;
2254 pNew->nOut -= nIn;
dan8ad1d8b2014-04-25 20:22:45 +00002255 }else{
drh1435a9a2013-08-27 23:15:44 +00002256#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
dan8ad1d8b2014-04-25 20:22:45 +00002257 tRowcnt nOut = 0;
2258 if( nInMul==0
2259 && pProbe->nSample
2260 && pNew->u.btree.nEq<=pProbe->nSampleCol
dan8ad1d8b2014-04-25 20:22:45 +00002261 && ((eOp & WO_IN)==0 || !ExprHasProperty(pTerm->pExpr, EP_xIsSelect))
dan8ad1d8b2014-04-25 20:22:45 +00002262 ){
2263 Expr *pExpr = pTerm->pExpr;
drhe8d0c612015-05-14 01:05:25 +00002264 if( (eOp & (WO_EQ|WO_ISNULL|WO_IS))!=0 ){
2265 testcase( eOp & WO_EQ );
2266 testcase( eOp & WO_IS );
dan8ad1d8b2014-04-25 20:22:45 +00002267 testcase( eOp & WO_ISNULL );
2268 rc = whereEqualScanEst(pParse, pBuilder, pExpr->pRight, &nOut);
2269 }else{
2270 rc = whereInScanEst(pParse, pBuilder, pExpr->x.pList, &nOut);
2271 }
dan8ad1d8b2014-04-25 20:22:45 +00002272 if( rc==SQLITE_NOTFOUND ) rc = SQLITE_OK;
2273 if( rc!=SQLITE_OK ) break; /* Jump out of the pTerm loop */
2274 if( nOut ){
2275 pNew->nOut = sqlite3LogEst(nOut);
2276 if( pNew->nOut>saved_nOut ) pNew->nOut = saved_nOut;
2277 pNew->nOut -= nIn;
2278 }
2279 }
2280 if( nOut==0 )
2281#endif
2282 {
2283 pNew->nOut += (pProbe->aiRowLogEst[nEq] - pProbe->aiRowLogEst[nEq-1]);
2284 if( eOp & WO_ISNULL ){
2285 /* TUNING: If there is no likelihood() value, assume that a
2286 ** "col IS NULL" expression matches twice as many rows
2287 ** as (col=?). */
2288 pNew->nOut += 10;
2289 }
2290 }
dan6cb8d762013-08-08 11:48:57 +00002291 }
drh6f2bfad2013-06-03 17:35:22 +00002292 }
dan8ad1d8b2014-04-25 20:22:45 +00002293
danaa9933c2014-04-24 20:04:49 +00002294 /* Set rCostIdx to the cost of visiting selected rows in index. Add
2295 ** it to pNew->rRun, which is currently set to the cost of the index
2296 ** seek only. Then, if this is a non-covering index, add the cost of
2297 ** visiting the rows in the main table. */
2298 rCostIdx = pNew->nOut + 1 + (15*pProbe->szIdxRow)/pSrc->pTab->szTabRow;
dan8ad1d8b2014-04-25 20:22:45 +00002299 pNew->rRun = sqlite3LogEstAdd(rLogSize, rCostIdx);
drhe217efc2013-06-12 03:48:41 +00002300 if( (pNew->wsFlags & (WHERE_IDX_ONLY|WHERE_IPK))==0 ){
danaa9933c2014-04-24 20:04:49 +00002301 pNew->rRun = sqlite3LogEstAdd(pNew->rRun, pNew->nOut + 16);
drheb04de32013-05-10 15:16:30 +00002302 }
drhdbd94862014-07-23 23:57:42 +00002303 ApplyCostMultiplier(pNew->rRun, pProbe->pTable->costMult);
danaa9933c2014-04-24 20:04:49 +00002304
dan8ad1d8b2014-04-25 20:22:45 +00002305 nOutUnadjusted = pNew->nOut;
2306 pNew->rRun += nInMul + nIn;
2307 pNew->nOut += nInMul + nIn;
drhd8b77e22014-09-06 01:35:57 +00002308 whereLoopOutputAdjust(pBuilder->pWC, pNew, rSize);
drhcf8fa7a2013-05-10 20:26:22 +00002309 rc = whereLoopInsert(pBuilder, pNew);
dan440e6ff2014-04-28 08:49:54 +00002310
2311 if( pNew->wsFlags & WHERE_COLUMN_RANGE ){
2312 pNew->nOut = saved_nOut;
2313 }else{
2314 pNew->nOut = nOutUnadjusted;
2315 }
dan8ad1d8b2014-04-25 20:22:45 +00002316
drh5346e952013-05-08 14:14:26 +00002317 if( (pNew->wsFlags & WHERE_TOP_LIMIT)==0
dan39129ce2014-06-30 15:23:57 +00002318 && pNew->u.btree.nEq<pProbe->nColumn
drh5346e952013-05-08 14:14:26 +00002319 ){
drhb8a8e8a2013-06-10 19:12:39 +00002320 whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nInMul+nIn);
drha18f3d22013-05-08 03:05:41 +00002321 }
danad45ed72013-08-08 12:21:32 +00002322 pNew->nOut = saved_nOut;
drh1435a9a2013-08-27 23:15:44 +00002323#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
dan7a419232013-08-06 20:01:43 +00002324 pBuilder->nRecValid = nRecValid;
dan7a419232013-08-06 20:01:43 +00002325#endif
drh1c8148f2013-05-04 20:25:23 +00002326 }
drh4efc9292013-06-06 23:02:03 +00002327 pNew->prereq = saved_prereq;
2328 pNew->u.btree.nEq = saved_nEq;
drhc8bbce12014-10-21 01:05:09 +00002329 pNew->nSkip = saved_nSkip;
drh4efc9292013-06-06 23:02:03 +00002330 pNew->wsFlags = saved_wsFlags;
2331 pNew->nOut = saved_nOut;
2332 pNew->nLTerm = saved_nLTerm;
drhc8bbce12014-10-21 01:05:09 +00002333
2334 /* Consider using a skip-scan if there are no WHERE clause constraints
2335 ** available for the left-most terms of the index, and if the average
2336 ** number of repeats in the left-most terms is at least 18.
2337 **
2338 ** The magic number 18 is selected on the basis that scanning 17 rows
2339 ** is almost always quicker than an index seek (even though if the index
2340 ** contains fewer than 2^17 rows we assume otherwise in other parts of
2341 ** the code). And, even if it is not, it should not be too much slower.
2342 ** On the other hand, the extra seeks could end up being significantly
2343 ** more expensive. */
2344 assert( 42==sqlite3LogEst(18) );
2345 if( saved_nEq==saved_nSkip
2346 && saved_nEq+1<pProbe->nKeyCol
drhf9df2fb2014-11-15 19:08:13 +00002347 && pProbe->noSkipScan==0
drhc8bbce12014-10-21 01:05:09 +00002348 && pProbe->aiRowLogEst[saved_nEq+1]>=42 /* TUNING: Minimum for skip-scan */
2349 && (rc = whereLoopResize(db, pNew, pNew->nLTerm+1))==SQLITE_OK
2350 ){
2351 LogEst nIter;
2352 pNew->u.btree.nEq++;
2353 pNew->nSkip++;
2354 pNew->aLTerm[pNew->nLTerm++] = 0;
2355 pNew->wsFlags |= WHERE_SKIPSCAN;
2356 nIter = pProbe->aiRowLogEst[saved_nEq] - pProbe->aiRowLogEst[saved_nEq+1];
drhc8bbce12014-10-21 01:05:09 +00002357 pNew->nOut -= nIter;
2358 /* TUNING: Because uncertainties in the estimates for skip-scan queries,
2359 ** add a 1.375 fudge factor to make skip-scan slightly less likely. */
2360 nIter += 5;
2361 whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nIter + nInMul);
2362 pNew->nOut = saved_nOut;
2363 pNew->u.btree.nEq = saved_nEq;
2364 pNew->nSkip = saved_nSkip;
2365 pNew->wsFlags = saved_wsFlags;
2366 }
2367
drh5346e952013-05-08 14:14:26 +00002368 return rc;
drh1c8148f2013-05-04 20:25:23 +00002369}
2370
2371/*
drh23f98da2013-05-21 15:52:07 +00002372** Return True if it is possible that pIndex might be useful in
2373** implementing the ORDER BY clause in pBuilder.
2374**
2375** Return False if pBuilder does not contain an ORDER BY clause or
2376** if there is no way for pIndex to be useful in implementing that
2377** ORDER BY clause.
2378*/
2379static int indexMightHelpWithOrderBy(
2380 WhereLoopBuilder *pBuilder,
2381 Index *pIndex,
2382 int iCursor
2383){
2384 ExprList *pOB;
drh6d381472013-06-13 17:58:08 +00002385 int ii, jj;
drh23f98da2013-05-21 15:52:07 +00002386
drh53cfbe92013-06-13 17:28:22 +00002387 if( pIndex->bUnordered ) return 0;
drh70d18342013-06-06 19:16:33 +00002388 if( (pOB = pBuilder->pWInfo->pOrderBy)==0 ) return 0;
drh23f98da2013-05-21 15:52:07 +00002389 for(ii=0; ii<pOB->nExpr; ii++){
drh45c154a2013-06-03 20:46:35 +00002390 Expr *pExpr = sqlite3ExprSkipCollate(pOB->a[ii].pExpr);
drh23f98da2013-05-21 15:52:07 +00002391 if( pExpr->op!=TK_COLUMN ) return 0;
2392 if( pExpr->iTable==iCursor ){
drh137fd4f2014-09-19 02:01:37 +00002393 if( pExpr->iColumn<0 ) return 1;
drhbbbdc832013-10-22 18:01:40 +00002394 for(jj=0; jj<pIndex->nKeyCol; jj++){
drh6d381472013-06-13 17:58:08 +00002395 if( pExpr->iColumn==pIndex->aiColumn[jj] ) return 1;
2396 }
drh23f98da2013-05-21 15:52:07 +00002397 }
2398 }
2399 return 0;
2400}
2401
2402/*
drh92a121f2013-06-10 12:15:47 +00002403** Return a bitmask where 1s indicate that the corresponding column of
2404** the table is used by an index. Only the first 63 columns are considered.
2405*/
drhfd5874d2013-06-12 14:52:39 +00002406static Bitmask columnsInIndex(Index *pIdx){
drh92a121f2013-06-10 12:15:47 +00002407 Bitmask m = 0;
2408 int j;
drhec95c442013-10-23 01:57:32 +00002409 for(j=pIdx->nColumn-1; j>=0; j--){
drh92a121f2013-06-10 12:15:47 +00002410 int x = pIdx->aiColumn[j];
drhec95c442013-10-23 01:57:32 +00002411 if( x>=0 ){
2412 testcase( x==BMS-1 );
2413 testcase( x==BMS-2 );
2414 if( x<BMS-1 ) m |= MASKBIT(x);
2415 }
drh92a121f2013-06-10 12:15:47 +00002416 }
2417 return m;
2418}
2419
drh4bd5f732013-07-31 23:22:39 +00002420/* Check to see if a partial index with pPartIndexWhere can be used
2421** in the current query. Return true if it can be and false if not.
2422*/
2423static int whereUsablePartialIndex(int iTab, WhereClause *pWC, Expr *pWhere){
2424 int i;
2425 WhereTerm *pTerm;
drhcf599b62015-08-07 20:57:00 +00002426 while( pWhere->op==TK_AND ){
2427 if( !whereUsablePartialIndex(iTab,pWC,pWhere->pLeft) ) return 0;
2428 pWhere = pWhere->pRight;
2429 }
drh4bd5f732013-07-31 23:22:39 +00002430 for(i=0, pTerm=pWC->a; i<pWC->nTerm; i++, pTerm++){
dan2a45cb52015-02-24 20:10:49 +00002431 Expr *pExpr = pTerm->pExpr;
2432 if( sqlite3ExprImpliesExpr(pExpr, pWhere, iTab)
2433 && (!ExprHasProperty(pExpr, EP_FromJoin) || pExpr->iRightJoinTable==iTab)
drh077f06e2015-02-24 16:48:59 +00002434 ){
2435 return 1;
2436 }
drh4bd5f732013-07-31 23:22:39 +00002437 }
2438 return 0;
2439}
drh92a121f2013-06-10 12:15:47 +00002440
/*
** Add all WhereLoop objects for a single table of the join where the table
** is identified by pBuilder->pNew->iTab.  That table is guaranteed to be
** a b-tree table, not a virtual table.
**
** The costs (WhereLoop.rRun) of the b-tree loops added by this function
** are calculated as follows:
**
** For a full scan, assuming the table (or index) contains nRow rows:
**
**     cost = nRow * 3.0                    // full-table scan
**     cost = nRow * K                      // scan of covering index
**     cost = nRow * (K+3.0)                // scan of non-covering index
**
** where K is a value between 1.1 and 3.0 set based on the relative
** estimated average size of the index and table records.
**
** For an index scan, where nVisit is the number of index rows visited
** by the scan, and nSeek is the number of seek operations required on
** the index b-tree:
**
**     cost = nSeek * (log(nRow) + K * nVisit)          // covering index
**     cost = nSeek * (log(nRow) + (K+3.0) * nVisit)    // non-covering index
**
** Normally, nSeek is 1. nSeek values greater than 1 come about if the
** WHERE clause includes "x IN (....)" terms used in place of "x=?". Or when
** implicit "x IN (SELECT x FROM tbl)" terms are added for skip-scans.
**
** The estimated values (nRow, nVisit, nSeek) often contain a large amount
** of uncertainty.  For this reason, scoring is designed to pick plans that
** "do the least harm" if the estimates are inaccurate.  For example, a
** log(nRow) factor is omitted from a non-covering index scan in order to
** bias the scoring in favor of using an index, since the worst-case
** performance of using an index is far better than the worst-case performance
** of a full table scan.
*/
drh5346e952013-05-08 14:14:26 +00002477static int whereLoopAddBtree(
drh1c8148f2013-05-04 20:25:23 +00002478 WhereLoopBuilder *pBuilder, /* WHERE clause information */
drh1c8148f2013-05-04 20:25:23 +00002479 Bitmask mExtra /* Extra prerequesites for using this table */
drhf1b5f5b2013-05-02 00:15:01 +00002480){
drh70d18342013-06-06 19:16:33 +00002481 WhereInfo *pWInfo; /* WHERE analysis context */
drh1c8148f2013-05-04 20:25:23 +00002482 Index *pProbe; /* An index we are evaluating */
drh1c8148f2013-05-04 20:25:23 +00002483 Index sPk; /* A fake index object for the primary key */
dancfc9df72014-04-25 15:01:01 +00002484 LogEst aiRowEstPk[2]; /* The aiRowLogEst[] value for the sPk index */
drhbbbdc832013-10-22 18:01:40 +00002485 i16 aiColumnPk = -1; /* The aColumn[] value for the sPk index */
drh70d18342013-06-06 19:16:33 +00002486 SrcList *pTabList; /* The FROM clause */
drh1c8148f2013-05-04 20:25:23 +00002487 struct SrcList_item *pSrc; /* The FROM clause btree term to add */
drh1c8148f2013-05-04 20:25:23 +00002488 WhereLoop *pNew; /* Template WhereLoop object */
drh5346e952013-05-08 14:14:26 +00002489 int rc = SQLITE_OK; /* Return code */
drhd044d202013-05-31 12:43:55 +00002490 int iSortIdx = 1; /* Index number */
drh23f98da2013-05-21 15:52:07 +00002491 int b; /* A boolean value */
drhbf539c42013-10-05 18:16:02 +00002492 LogEst rSize; /* number of rows in the table */
2493 LogEst rLogSize; /* Logarithm of the number of rows in the table */
drh4bd5f732013-07-31 23:22:39 +00002494 WhereClause *pWC; /* The parsed WHERE clause */
drh3495d202013-10-07 17:32:15 +00002495 Table *pTab; /* Table being queried */
drh23f98da2013-05-21 15:52:07 +00002496
drh1c8148f2013-05-04 20:25:23 +00002497 pNew = pBuilder->pNew;
drh70d18342013-06-06 19:16:33 +00002498 pWInfo = pBuilder->pWInfo;
2499 pTabList = pWInfo->pTabList;
2500 pSrc = pTabList->a + pNew->iTab;
drh3495d202013-10-07 17:32:15 +00002501 pTab = pSrc->pTab;
drh4bd5f732013-07-31 23:22:39 +00002502 pWC = pBuilder->pWC;
drh0823c892013-05-11 00:06:23 +00002503 assert( !IsVirtual(pSrc->pTab) );
drh1c8148f2013-05-04 20:25:23 +00002504
drh8a48b9c2015-08-19 15:20:00 +00002505 if( pSrc->pIBIndex ){
drh1c8148f2013-05-04 20:25:23 +00002506 /* An INDEXED BY clause specifies a particular index to use */
drh8a48b9c2015-08-19 15:20:00 +00002507 pProbe = pSrc->pIBIndex;
drhec95c442013-10-23 01:57:32 +00002508 }else if( !HasRowid(pTab) ){
2509 pProbe = pTab->pIndex;
drh1c8148f2013-05-04 20:25:23 +00002510 }else{
2511 /* There is no INDEXED BY clause. Create a fake Index object in local
2512 ** variable sPk to represent the rowid primary key index. Make this
2513 ** fake index the first in a chain of Index objects with all of the real
2514 ** indices to follow */
2515 Index *pFirst; /* First of real indices on the table */
2516 memset(&sPk, 0, sizeof(Index));
drhbbbdc832013-10-22 18:01:40 +00002517 sPk.nKeyCol = 1;
dan39129ce2014-06-30 15:23:57 +00002518 sPk.nColumn = 1;
drh1c8148f2013-05-04 20:25:23 +00002519 sPk.aiColumn = &aiColumnPk;
dancfc9df72014-04-25 15:01:01 +00002520 sPk.aiRowLogEst = aiRowEstPk;
drh1c8148f2013-05-04 20:25:23 +00002521 sPk.onError = OE_Replace;
drh3495d202013-10-07 17:32:15 +00002522 sPk.pTable = pTab;
danaa9933c2014-04-24 20:04:49 +00002523 sPk.szIdxRow = pTab->szTabRow;
dancfc9df72014-04-25 15:01:01 +00002524 aiRowEstPk[0] = pTab->nRowLogEst;
2525 aiRowEstPk[1] = 0;
drh1c8148f2013-05-04 20:25:23 +00002526 pFirst = pSrc->pTab->pIndex;
drh8a48b9c2015-08-19 15:20:00 +00002527 if( pSrc->fg.notIndexed==0 ){
drh1c8148f2013-05-04 20:25:23 +00002528 /* The real indices of the table are only considered if the
2529 ** NOT INDEXED qualifier is omitted from the FROM clause */
2530 sPk.pNext = pFirst;
2531 }
2532 pProbe = &sPk;
2533 }
dancfc9df72014-04-25 15:01:01 +00002534 rSize = pTab->nRowLogEst;
drheb04de32013-05-10 15:16:30 +00002535 rLogSize = estLog(rSize);
2536
drhfeb56e02013-08-23 17:33:46 +00002537#ifndef SQLITE_OMIT_AUTOMATIC_INDEX
drheb04de32013-05-10 15:16:30 +00002538 /* Automatic indexes */
drh8a48b9c2015-08-19 15:20:00 +00002539 if( !pBuilder->pOrSet /* Not part of an OR optimization */
drh8e8e7ef2015-03-02 17:25:00 +00002540 && (pWInfo->wctrlFlags & WHERE_NO_AUTOINDEX)==0
drh4fe425a2013-06-12 17:08:06 +00002541 && (pWInfo->pParse->db->flags & SQLITE_AutoIndex)!=0
drh8a48b9c2015-08-19 15:20:00 +00002542 && pSrc->pIBIndex==0 /* Has no INDEXED BY clause */
2543 && !pSrc->fg.notIndexed /* Has no NOT INDEXED clause */
2544 && HasRowid(pTab) /* Is not a WITHOUT ROWID table. (FIXME: Why not?) */
2545 && !pSrc->fg.isCorrelated /* Not a correlated subquery */
2546 && !pSrc->fg.isRecursive /* Not a recursive common table expression. */
drheb04de32013-05-10 15:16:30 +00002547 ){
2548 /* Generate auto-index WhereLoops */
drheb04de32013-05-10 15:16:30 +00002549 WhereTerm *pTerm;
2550 WhereTerm *pWCEnd = pWC->a + pWC->nTerm;
2551 for(pTerm=pWC->a; rc==SQLITE_OK && pTerm<pWCEnd; pTerm++){
drh79a13bf2013-05-31 20:28:28 +00002552 if( pTerm->prereqRight & pNew->maskSelf ) continue;
drheb04de32013-05-10 15:16:30 +00002553 if( termCanDriveIndex(pTerm, pSrc, 0) ){
2554 pNew->u.btree.nEq = 1;
drhc8bbce12014-10-21 01:05:09 +00002555 pNew->nSkip = 0;
drhef866372013-05-22 20:49:02 +00002556 pNew->u.btree.pIndex = 0;
drh4efc9292013-06-06 23:02:03 +00002557 pNew->nLTerm = 1;
2558 pNew->aLTerm[0] = pTerm;
drhe1e2e9a2013-06-13 15:16:53 +00002559 /* TUNING: One-time cost for computing the automatic index is
drh7e074332014-09-22 14:30:51 +00002560 ** estimated to be X*N*log2(N) where N is the number of rows in
2561 ** the table being indexed and where X is 7 (LogEst=28) for normal
2562 ** tables or 1.375 (LogEst=4) for views and subqueries. The value
2563 ** of X is smaller for views and subqueries so that the query planner
2564 ** will be more aggressive about generating automatic indexes for
2565 ** those objects, since there is no opportunity to add schema
2566 ** indexes on subqueries and views. */
2567 pNew->rSetup = rLogSize + rSize + 4;
2568 if( pTab->pSelect==0 && (pTab->tabFlags & TF_Ephemeral)==0 ){
2569 pNew->rSetup += 24;
2570 }
drhdbd94862014-07-23 23:57:42 +00002571 ApplyCostMultiplier(pNew->rSetup, pTab->costMult);
drh986b3872013-06-28 21:12:20 +00002572 /* TUNING: Each index lookup yields 20 rows in the table. This
2573 ** is more than the usual guess of 10 rows, since we have no way
peter.d.reid60ec9142014-09-06 16:39:46 +00002574 ** of knowing how selective the index will ultimately be. It would
drh986b3872013-06-28 21:12:20 +00002575 ** not be unreasonable to make this value much larger. */
drhbf539c42013-10-05 18:16:02 +00002576 pNew->nOut = 43; assert( 43==sqlite3LogEst(20) );
drhb50596d2013-10-08 20:42:41 +00002577 pNew->rRun = sqlite3LogEstAdd(rLogSize,pNew->nOut);
drh986b3872013-06-28 21:12:20 +00002578 pNew->wsFlags = WHERE_AUTO_INDEX;
drheb04de32013-05-10 15:16:30 +00002579 pNew->prereq = mExtra | pTerm->prereqRight;
drhcf8fa7a2013-05-10 20:26:22 +00002580 rc = whereLoopInsert(pBuilder, pNew);
drheb04de32013-05-10 15:16:30 +00002581 }
2582 }
2583 }
drhfeb56e02013-08-23 17:33:46 +00002584#endif /* SQLITE_OMIT_AUTOMATIC_INDEX */
drh1c8148f2013-05-04 20:25:23 +00002585
2586 /* Loop over all indices
2587 */
drh23f98da2013-05-21 15:52:07 +00002588 for(; rc==SQLITE_OK && pProbe; pProbe=pProbe->pNext, iSortIdx++){
drh4bd5f732013-07-31 23:22:39 +00002589 if( pProbe->pPartIdxWhere!=0
dan08291692014-08-27 17:37:20 +00002590 && !whereUsablePartialIndex(pSrc->iCursor, pWC, pProbe->pPartIdxWhere) ){
2591 testcase( pNew->iTab!=pSrc->iCursor ); /* See ticket [98d973b8f5] */
drh4bd5f732013-07-31 23:22:39 +00002592 continue; /* Partial index inappropriate for this query */
2593 }
dan7de2a1f2014-04-28 20:11:20 +00002594 rSize = pProbe->aiRowLogEst[0];
drh5346e952013-05-08 14:14:26 +00002595 pNew->u.btree.nEq = 0;
drhc8bbce12014-10-21 01:05:09 +00002596 pNew->nSkip = 0;
drh4efc9292013-06-06 23:02:03 +00002597 pNew->nLTerm = 0;
drh23f98da2013-05-21 15:52:07 +00002598 pNew->iSortIdx = 0;
drhb8a8e8a2013-06-10 19:12:39 +00002599 pNew->rSetup = 0;
drh23f98da2013-05-21 15:52:07 +00002600 pNew->prereq = mExtra;
drh74f91d42013-06-19 18:01:44 +00002601 pNew->nOut = rSize;
drh23f98da2013-05-21 15:52:07 +00002602 pNew->u.btree.pIndex = pProbe;
2603 b = indexMightHelpWithOrderBy(pBuilder, pProbe, pSrc->iCursor);
drh53cfbe92013-06-13 17:28:22 +00002604 /* The ONEPASS_DESIRED flags never occurs together with ORDER BY */
2605 assert( (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 || b==0 );
drh43fe25f2013-05-07 23:06:23 +00002606 if( pProbe->tnum<=0 ){
2607 /* Integer primary key index */
2608 pNew->wsFlags = WHERE_IPK;
drh23f98da2013-05-21 15:52:07 +00002609
2610 /* Full table scan */
drhd044d202013-05-31 12:43:55 +00002611 pNew->iSortIdx = b ? iSortIdx : 0;
danaa9933c2014-04-24 20:04:49 +00002612 /* TUNING: Cost of full table scan is (N*3.0). */
2613 pNew->rRun = rSize + 16;
drhdbd94862014-07-23 23:57:42 +00002614 ApplyCostMultiplier(pNew->rRun, pTab->costMult);
drhd8b77e22014-09-06 01:35:57 +00002615 whereLoopOutputAdjust(pWC, pNew, rSize);
drh23f98da2013-05-21 15:52:07 +00002616 rc = whereLoopInsert(pBuilder, pNew);
drhcca9f3d2013-09-06 15:23:29 +00002617 pNew->nOut = rSize;
drh23f98da2013-05-21 15:52:07 +00002618 if( rc ) break;
drh43fe25f2013-05-07 23:06:23 +00002619 }else{
drhec95c442013-10-23 01:57:32 +00002620 Bitmask m;
2621 if( pProbe->isCovering ){
2622 pNew->wsFlags = WHERE_IDX_ONLY | WHERE_INDEXED;
2623 m = 0;
2624 }else{
2625 m = pSrc->colUsed & ~columnsInIndex(pProbe);
2626 pNew->wsFlags = (m==0) ? (WHERE_IDX_ONLY|WHERE_INDEXED) : WHERE_INDEXED;
2627 }
drh1c8148f2013-05-04 20:25:23 +00002628
drh23f98da2013-05-21 15:52:07 +00002629 /* Full scan via index */
drh53cfbe92013-06-13 17:28:22 +00002630 if( b
drh702ba9f2013-11-07 21:25:13 +00002631 || !HasRowid(pTab)
drh53cfbe92013-06-13 17:28:22 +00002632 || ( m==0
2633 && pProbe->bUnordered==0
drh702ba9f2013-11-07 21:25:13 +00002634 && (pProbe->szIdxRow<pTab->szTabRow)
drh53cfbe92013-06-13 17:28:22 +00002635 && (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0
2636 && sqlite3GlobalConfig.bUseCis
2637 && OptimizationEnabled(pWInfo->pParse->db, SQLITE_CoverIdxScan)
2638 )
drhe3b7c922013-06-03 19:17:40 +00002639 ){
drh23f98da2013-05-21 15:52:07 +00002640 pNew->iSortIdx = b ? iSortIdx : 0;
danaa9933c2014-04-24 20:04:49 +00002641
2642 /* The cost of visiting the index rows is N*K, where K is
2643 ** between 1.1 and 3.0, depending on the relative sizes of the
2644 ** index and table rows. If this is a non-covering index scan,
2645 ** also add the cost of visiting table rows (N*3.0). */
2646 pNew->rRun = rSize + 1 + (15*pProbe->szIdxRow)/pTab->szTabRow;
2647 if( m!=0 ){
2648 pNew->rRun = sqlite3LogEstAdd(pNew->rRun, rSize+16);
drhe1e2e9a2013-06-13 15:16:53 +00002649 }
drhdbd94862014-07-23 23:57:42 +00002650 ApplyCostMultiplier(pNew->rRun, pTab->costMult);
drhd8b77e22014-09-06 01:35:57 +00002651 whereLoopOutputAdjust(pWC, pNew, rSize);
drh23f98da2013-05-21 15:52:07 +00002652 rc = whereLoopInsert(pBuilder, pNew);
drhcca9f3d2013-09-06 15:23:29 +00002653 pNew->nOut = rSize;
drh23f98da2013-05-21 15:52:07 +00002654 if( rc ) break;
2655 }
2656 }
dan7a419232013-08-06 20:01:43 +00002657
drhb8a8e8a2013-06-10 19:12:39 +00002658 rc = whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, 0);
drh1435a9a2013-08-27 23:15:44 +00002659#ifdef SQLITE_ENABLE_STAT3_OR_STAT4
dan87cd9322013-08-07 15:52:41 +00002660 sqlite3Stat4ProbeFree(pBuilder->pRec);
2661 pBuilder->nRecValid = 0;
2662 pBuilder->pRec = 0;
danddc2d6e2013-08-06 20:15:06 +00002663#endif
drh1c8148f2013-05-04 20:25:23 +00002664
2665 /* If there was an INDEXED BY clause, then only that one index is
2666 ** considered. */
drh8a48b9c2015-08-19 15:20:00 +00002667 if( pSrc->pIBIndex ) break;
drh1c8148f2013-05-04 20:25:23 +00002668 }
drh5346e952013-05-08 14:14:26 +00002669 return rc;
drhf1b5f5b2013-05-02 00:15:01 +00002670}
2671
drh8636e9c2013-06-11 01:50:08 +00002672#ifndef SQLITE_OMIT_VIRTUALTABLE
drhf1b5f5b2013-05-02 00:15:01 +00002673/*
drh0823c892013-05-11 00:06:23 +00002674** Add all WhereLoop objects for a table of the join identified by
2675** pBuilder->pNew->iTab. That table is guaranteed to be a virtual table.
dan4f20cd42015-06-08 18:05:54 +00002676**
2677** If there are no LEFT or CROSS JOIN joins in the query, both mExtra and
2678** mUnusable are set to 0. Otherwise, mExtra is a mask of all FROM clause
2679** entries that occur before the virtual table in the FROM clause and are
2680** separated from it by at least one LEFT or CROSS JOIN. Similarly, the
2681** mUnusable mask contains all FROM clause entries that occur after the
2682** virtual table and are separated from it by at least one LEFT or
2683** CROSS JOIN.
2684**
2685** For example, if the query were:
2686**
2687** ... FROM t1, t2 LEFT JOIN t3, t4, vt CROSS JOIN t5, t6;
2688**
2689** then mExtra corresponds to (t1, t2) and mUnusable to (t5, t6).
2690**
2691** All the tables in mExtra must be scanned before the current virtual
2692** table. So any terms for which all prerequisites are satisfied by
2693** mExtra may be specified as "usable" in all calls to xBestIndex.
2694** Conversely, all tables in mUnusable must be scanned after the current
2695** virtual table, so any terms for which the prerequisites overlap with
2696** mUnusable should always be configured as "not-usable" for xBestIndex.
drhf1b5f5b2013-05-02 00:15:01 +00002697*/
drh5346e952013-05-08 14:14:26 +00002698static int whereLoopAddVirtual(
danff4b23b2013-11-12 12:17:16 +00002699 WhereLoopBuilder *pBuilder, /* WHERE clause information */
dan4f20cd42015-06-08 18:05:54 +00002700 Bitmask mExtra, /* Tables that must be scanned before this one */
2701 Bitmask mUnusable /* Tables that must be scanned after this one */
drhf1b5f5b2013-05-02 00:15:01 +00002702){
drh70d18342013-06-06 19:16:33 +00002703 WhereInfo *pWInfo; /* WHERE analysis context */
drh5346e952013-05-08 14:14:26 +00002704 Parse *pParse; /* The parsing context */
2705 WhereClause *pWC; /* The WHERE clause */
2706 struct SrcList_item *pSrc; /* The FROM clause term to search */
2707 Table *pTab;
2708 sqlite3 *db;
2709 sqlite3_index_info *pIdxInfo;
2710 struct sqlite3_index_constraint *pIdxCons;
2711 struct sqlite3_index_constraint_usage *pUsage;
2712 WhereTerm *pTerm;
2713 int i, j;
2714 int iTerm, mxTerm;
drh4efc9292013-06-06 23:02:03 +00002715 int nConstraint;
drh5346e952013-05-08 14:14:26 +00002716 int seenIn = 0; /* True if an IN operator is seen */
2717 int seenVar = 0; /* True if a non-constant constraint is seen */
2718 int iPhase; /* 0: const w/o IN, 1: const, 2: no IN, 2: IN */
2719 WhereLoop *pNew;
drh5346e952013-05-08 14:14:26 +00002720 int rc = SQLITE_OK;
2721
dan4f20cd42015-06-08 18:05:54 +00002722 assert( (mExtra & mUnusable)==0 );
drh70d18342013-06-06 19:16:33 +00002723 pWInfo = pBuilder->pWInfo;
2724 pParse = pWInfo->pParse;
drh5346e952013-05-08 14:14:26 +00002725 db = pParse->db;
2726 pWC = pBuilder->pWC;
drh5346e952013-05-08 14:14:26 +00002727 pNew = pBuilder->pNew;
drh70d18342013-06-06 19:16:33 +00002728 pSrc = &pWInfo->pTabList->a[pNew->iTab];
drhb2a90f02013-05-10 03:30:49 +00002729 pTab = pSrc->pTab;
drh0823c892013-05-11 00:06:23 +00002730 assert( IsVirtual(pTab) );
dan4f20cd42015-06-08 18:05:54 +00002731 pIdxInfo = allocateIndexInfo(pParse, pWC, mUnusable, pSrc,pBuilder->pOrderBy);
drh5346e952013-05-08 14:14:26 +00002732 if( pIdxInfo==0 ) return SQLITE_NOMEM;
drh5346e952013-05-08 14:14:26 +00002733 pNew->prereq = 0;
drh5346e952013-05-08 14:14:26 +00002734 pNew->rSetup = 0;
2735 pNew->wsFlags = WHERE_VIRTUALTABLE;
drh4efc9292013-06-06 23:02:03 +00002736 pNew->nLTerm = 0;
drh5346e952013-05-08 14:14:26 +00002737 pNew->u.vtab.needFree = 0;
2738 pUsage = pIdxInfo->aConstraintUsage;
drh4efc9292013-06-06 23:02:03 +00002739 nConstraint = pIdxInfo->nConstraint;
drh7963b0e2013-06-17 21:37:40 +00002740 if( whereLoopResize(db, pNew, nConstraint) ){
2741 sqlite3DbFree(db, pIdxInfo);
2742 return SQLITE_NOMEM;
2743 }
drh5346e952013-05-08 14:14:26 +00002744
drh0823c892013-05-11 00:06:23 +00002745 for(iPhase=0; iPhase<=3; iPhase++){
drh5346e952013-05-08 14:14:26 +00002746 if( !seenIn && (iPhase&1)!=0 ){
2747 iPhase++;
2748 if( iPhase>3 ) break;
2749 }
2750 if( !seenVar && iPhase>1 ) break;
2751 pIdxCons = *(struct sqlite3_index_constraint**)&pIdxInfo->aConstraint;
2752 for(i=0; i<pIdxInfo->nConstraint; i++, pIdxCons++){
2753 j = pIdxCons->iTermOffset;
2754 pTerm = &pWC->a[j];
2755 switch( iPhase ){
2756 case 0: /* Constants without IN operator */
2757 pIdxCons->usable = 0;
2758 if( (pTerm->eOperator & WO_IN)!=0 ){
2759 seenIn = 1;
drh7963b0e2013-06-17 21:37:40 +00002760 }
dan4f20cd42015-06-08 18:05:54 +00002761 if( (pTerm->prereqRight & ~mExtra)!=0 ){
drh5346e952013-05-08 14:14:26 +00002762 seenVar = 1;
drh7963b0e2013-06-17 21:37:40 +00002763 }else if( (pTerm->eOperator & WO_IN)==0 ){
drh5346e952013-05-08 14:14:26 +00002764 pIdxCons->usable = 1;
2765 }
2766 break;
2767 case 1: /* Constants with IN operators */
2768 assert( seenIn );
dan4f20cd42015-06-08 18:05:54 +00002769 pIdxCons->usable = (pTerm->prereqRight & ~mExtra)==0;
drh5346e952013-05-08 14:14:26 +00002770 break;
2771 case 2: /* Variables without IN */
2772 assert( seenVar );
2773 pIdxCons->usable = (pTerm->eOperator & WO_IN)==0;
2774 break;
2775 default: /* Variables with IN */
2776 assert( seenVar && seenIn );
2777 pIdxCons->usable = 1;
2778 break;
2779 }
2780 }
2781 memset(pUsage, 0, sizeof(pUsage[0])*pIdxInfo->nConstraint);
2782 if( pIdxInfo->needToFreeIdxStr ) sqlite3_free(pIdxInfo->idxStr);
2783 pIdxInfo->idxStr = 0;
2784 pIdxInfo->idxNum = 0;
2785 pIdxInfo->needToFreeIdxStr = 0;
2786 pIdxInfo->orderByConsumed = 0;
drh8636e9c2013-06-11 01:50:08 +00002787 pIdxInfo->estimatedCost = SQLITE_BIG_DBL / (double)2;
dana9f58152013-11-11 19:01:33 +00002788 pIdxInfo->estimatedRows = 25;
drh5346e952013-05-08 14:14:26 +00002789 rc = vtabBestIndex(pParse, pTab, pIdxInfo);
2790 if( rc ) goto whereLoopAddVtab_exit;
2791 pIdxCons = *(struct sqlite3_index_constraint**)&pIdxInfo->aConstraint;
danff4b23b2013-11-12 12:17:16 +00002792 pNew->prereq = mExtra;
drhc718f1c2013-05-08 20:05:58 +00002793 mxTerm = -1;
drh4efc9292013-06-06 23:02:03 +00002794 assert( pNew->nLSlot>=nConstraint );
2795 for(i=0; i<nConstraint; i++) pNew->aLTerm[i] = 0;
drh3bd26f02013-05-24 14:52:03 +00002796 pNew->u.vtab.omitMask = 0;
drh4efc9292013-06-06 23:02:03 +00002797 for(i=0; i<nConstraint; i++, pIdxCons++){
drh5346e952013-05-08 14:14:26 +00002798 if( (iTerm = pUsage[i].argvIndex - 1)>=0 ){
2799 j = pIdxCons->iTermOffset;
drh4efc9292013-06-06 23:02:03 +00002800 if( iTerm>=nConstraint
drh5346e952013-05-08 14:14:26 +00002801 || j<0
2802 || j>=pWC->nTerm
drh4efc9292013-06-06 23:02:03 +00002803 || pNew->aLTerm[iTerm]!=0
drh5346e952013-05-08 14:14:26 +00002804 ){
2805 rc = SQLITE_ERROR;
2806 sqlite3ErrorMsg(pParse, "%s.xBestIndex() malfunction", pTab->zName);
2807 goto whereLoopAddVtab_exit;
2808 }
drh7963b0e2013-06-17 21:37:40 +00002809 testcase( iTerm==nConstraint-1 );
2810 testcase( j==0 );
2811 testcase( j==pWC->nTerm-1 );
drh5346e952013-05-08 14:14:26 +00002812 pTerm = &pWC->a[j];
2813 pNew->prereq |= pTerm->prereqRight;
drh4efc9292013-06-06 23:02:03 +00002814 assert( iTerm<pNew->nLSlot );
2815 pNew->aLTerm[iTerm] = pTerm;
drh5346e952013-05-08 14:14:26 +00002816 if( iTerm>mxTerm ) mxTerm = iTerm;
drh7963b0e2013-06-17 21:37:40 +00002817 testcase( iTerm==15 );
2818 testcase( iTerm==16 );
drh52986302013-06-03 16:03:16 +00002819 if( iTerm<16 && pUsage[i].omit ) pNew->u.vtab.omitMask |= 1<<iTerm;
drh5346e952013-05-08 14:14:26 +00002820 if( (pTerm->eOperator & WO_IN)!=0 ){
2821 if( pUsage[i].omit==0 ){
2822 /* Do not attempt to use an IN constraint if the virtual table
2823 ** says that the equivalent EQ constraint cannot be safely omitted.
2824 ** If we do attempt to use such a constraint, some rows might be
2825 ** repeated in the output. */
2826 break;
2827 }
2828 /* A virtual table that is constrained by an IN clause may not
2829 ** consume the ORDER BY clause because (1) the order of IN terms
2830 ** is not necessarily related to the order of output terms and
2831 ** (2) Multiple outputs from a single IN value will not merge
2832 ** together. */
2833 pIdxInfo->orderByConsumed = 0;
2834 }
2835 }
2836 }
drh4efc9292013-06-06 23:02:03 +00002837 if( i>=nConstraint ){
2838 pNew->nLTerm = mxTerm+1;
2839 assert( pNew->nLTerm<=pNew->nLSlot );
drh5346e952013-05-08 14:14:26 +00002840 pNew->u.vtab.idxNum = pIdxInfo->idxNum;
2841 pNew->u.vtab.needFree = pIdxInfo->needToFreeIdxStr;
2842 pIdxInfo->needToFreeIdxStr = 0;
2843 pNew->u.vtab.idxStr = pIdxInfo->idxStr;
drh0401ace2014-03-18 15:30:27 +00002844 pNew->u.vtab.isOrdered = (i8)(pIdxInfo->orderByConsumed ?
2845 pIdxInfo->nOrderBy : 0);
drhb8a8e8a2013-06-10 19:12:39 +00002846 pNew->rSetup = 0;
drhb50596d2013-10-08 20:42:41 +00002847 pNew->rRun = sqlite3LogEstFromDouble(pIdxInfo->estimatedCost);
dana9f58152013-11-11 19:01:33 +00002848 pNew->nOut = sqlite3LogEst(pIdxInfo->estimatedRows);
drhcf8fa7a2013-05-10 20:26:22 +00002849 whereLoopInsert(pBuilder, pNew);
drh5346e952013-05-08 14:14:26 +00002850 if( pNew->u.vtab.needFree ){
2851 sqlite3_free(pNew->u.vtab.idxStr);
2852 pNew->u.vtab.needFree = 0;
2853 }
2854 }
2855 }
2856
2857whereLoopAddVtab_exit:
2858 if( pIdxInfo->needToFreeIdxStr ) sqlite3_free(pIdxInfo->idxStr);
2859 sqlite3DbFree(db, pIdxInfo);
2860 return rc;
drhf1b5f5b2013-05-02 00:15:01 +00002861}
drh8636e9c2013-06-11 01:50:08 +00002862#endif /* SQLITE_OMIT_VIRTUALTABLE */
drhf1b5f5b2013-05-02 00:15:01 +00002863
2864/*
drhcf8fa7a2013-05-10 20:26:22 +00002865** Add WhereLoop entries to handle OR terms. This works for either
2866** btrees or virtual tables.
2867*/
dan4f20cd42015-06-08 18:05:54 +00002868static int whereLoopAddOr(
2869 WhereLoopBuilder *pBuilder,
2870 Bitmask mExtra,
2871 Bitmask mUnusable
2872){
drh70d18342013-06-06 19:16:33 +00002873 WhereInfo *pWInfo = pBuilder->pWInfo;
drhcf8fa7a2013-05-10 20:26:22 +00002874 WhereClause *pWC;
2875 WhereLoop *pNew;
2876 WhereTerm *pTerm, *pWCEnd;
2877 int rc = SQLITE_OK;
2878 int iCur;
2879 WhereClause tempWC;
2880 WhereLoopBuilder sSubBuild;
dan5da73e12014-04-30 18:11:55 +00002881 WhereOrSet sSum, sCur;
drhcf8fa7a2013-05-10 20:26:22 +00002882 struct SrcList_item *pItem;
2883
drhcf8fa7a2013-05-10 20:26:22 +00002884 pWC = pBuilder->pWC;
drhcf8fa7a2013-05-10 20:26:22 +00002885 pWCEnd = pWC->a + pWC->nTerm;
2886 pNew = pBuilder->pNew;
drh77dfd5b2013-08-19 11:15:48 +00002887 memset(&sSum, 0, sizeof(sSum));
drh186ad8c2013-10-08 18:40:37 +00002888 pItem = pWInfo->pTabList->a + pNew->iTab;
2889 iCur = pItem->iCursor;
drhcf8fa7a2013-05-10 20:26:22 +00002890
2891 for(pTerm=pWC->a; pTerm<pWCEnd && rc==SQLITE_OK; pTerm++){
2892 if( (pTerm->eOperator & WO_OR)!=0
2893 && (pTerm->u.pOrInfo->indexable & pNew->maskSelf)!=0
2894 ){
2895 WhereClause * const pOrWC = &pTerm->u.pOrInfo->wc;
2896 WhereTerm * const pOrWCEnd = &pOrWC->a[pOrWC->nTerm];
2897 WhereTerm *pOrTerm;
drhaa32e3c2013-07-16 21:31:23 +00002898 int once = 1;
2899 int i, j;
drh783dece2013-06-05 17:53:43 +00002900
drh783dece2013-06-05 17:53:43 +00002901 sSubBuild = *pBuilder;
2902 sSubBuild.pOrderBy = 0;
drhaa32e3c2013-07-16 21:31:23 +00002903 sSubBuild.pOrSet = &sCur;
drhcf8fa7a2013-05-10 20:26:22 +00002904
drh0a99ba32014-09-30 17:03:35 +00002905 WHERETRACE(0x200, ("Begin processing OR-clause %p\n", pTerm));
drhc7f0d222013-06-19 03:27:12 +00002906 for(pOrTerm=pOrWC->a; pOrTerm<pOrWCEnd; pOrTerm++){
drh783dece2013-06-05 17:53:43 +00002907 if( (pOrTerm->eOperator & WO_AND)!=0 ){
drhcf8fa7a2013-05-10 20:26:22 +00002908 sSubBuild.pWC = &pOrTerm->u.pAndInfo->wc;
2909 }else if( pOrTerm->leftCursor==iCur ){
drh70d18342013-06-06 19:16:33 +00002910 tempWC.pWInfo = pWC->pWInfo;
drh783dece2013-06-05 17:53:43 +00002911 tempWC.pOuter = pWC;
2912 tempWC.op = TK_AND;
drh783dece2013-06-05 17:53:43 +00002913 tempWC.nTerm = 1;
drhcf8fa7a2013-05-10 20:26:22 +00002914 tempWC.a = pOrTerm;
2915 sSubBuild.pWC = &tempWC;
2916 }else{
2917 continue;
2918 }
drhaa32e3c2013-07-16 21:31:23 +00002919 sCur.n = 0;
drh52651492014-09-30 14:14:19 +00002920#ifdef WHERETRACE_ENABLED
drh0a99ba32014-09-30 17:03:35 +00002921 WHERETRACE(0x200, ("OR-term %d of %p has %d subterms:\n",
2922 (int)(pOrTerm-pOrWC->a), pTerm, sSubBuild.pWC->nTerm));
2923 if( sqlite3WhereTrace & 0x400 ){
2924 for(i=0; i<sSubBuild.pWC->nTerm; i++){
2925 whereTermPrint(&sSubBuild.pWC->a[i], i);
2926 }
drh52651492014-09-30 14:14:19 +00002927 }
2928#endif
drh8636e9c2013-06-11 01:50:08 +00002929#ifndef SQLITE_OMIT_VIRTUALTABLE
drhcf8fa7a2013-05-10 20:26:22 +00002930 if( IsVirtual(pItem->pTab) ){
dan4f20cd42015-06-08 18:05:54 +00002931 rc = whereLoopAddVirtual(&sSubBuild, mExtra, mUnusable);
drh8636e9c2013-06-11 01:50:08 +00002932 }else
2933#endif
2934 {
drhcf8fa7a2013-05-10 20:26:22 +00002935 rc = whereLoopAddBtree(&sSubBuild, mExtra);
2936 }
drh36be4c42014-09-30 17:31:23 +00002937 if( rc==SQLITE_OK ){
dan4f20cd42015-06-08 18:05:54 +00002938 rc = whereLoopAddOr(&sSubBuild, mExtra, mUnusable);
drh36be4c42014-09-30 17:31:23 +00002939 }
drhaa32e3c2013-07-16 21:31:23 +00002940 assert( rc==SQLITE_OK || sCur.n==0 );
2941 if( sCur.n==0 ){
2942 sSum.n = 0;
2943 break;
2944 }else if( once ){
2945 whereOrMove(&sSum, &sCur);
2946 once = 0;
2947 }else{
dan5da73e12014-04-30 18:11:55 +00002948 WhereOrSet sPrev;
drhaa32e3c2013-07-16 21:31:23 +00002949 whereOrMove(&sPrev, &sSum);
2950 sSum.n = 0;
2951 for(i=0; i<sPrev.n; i++){
2952 for(j=0; j<sCur.n; j++){
2953 whereOrInsert(&sSum, sPrev.a[i].prereq | sCur.a[j].prereq,
drhbf539c42013-10-05 18:16:02 +00002954 sqlite3LogEstAdd(sPrev.a[i].rRun, sCur.a[j].rRun),
2955 sqlite3LogEstAdd(sPrev.a[i].nOut, sCur.a[j].nOut));
drhaa32e3c2013-07-16 21:31:23 +00002956 }
2957 }
2958 }
drhcf8fa7a2013-05-10 20:26:22 +00002959 }
drhaa32e3c2013-07-16 21:31:23 +00002960 pNew->nLTerm = 1;
2961 pNew->aLTerm[0] = pTerm;
2962 pNew->wsFlags = WHERE_MULTI_OR;
2963 pNew->rSetup = 0;
2964 pNew->iSortIdx = 0;
2965 memset(&pNew->u, 0, sizeof(pNew->u));
2966 for(i=0; rc==SQLITE_OK && i<sSum.n; i++){
dan5da73e12014-04-30 18:11:55 +00002967 /* TUNING: Currently sSum.a[i].rRun is set to the sum of the costs
2968 ** of all sub-scans required by the OR-scan. However, due to rounding
2969 ** errors, it may be that the cost of the OR-scan is equal to its
2970 ** most expensive sub-scan. Add the smallest possible penalty
2971 ** (equivalent to multiplying the cost by 1.07) to ensure that
2972 ** this does not happen. Otherwise, for WHERE clauses such as the
2973 ** following where there is an index on "y":
2974 **
2975 ** WHERE likelihood(x=?, 0.99) OR y=?
2976 **
2977 ** the planner may elect to "OR" together a full-table scan and an
2978 ** index lookup. And other similarly odd results. */
2979 pNew->rRun = sSum.a[i].rRun + 1;
drhaa32e3c2013-07-16 21:31:23 +00002980 pNew->nOut = sSum.a[i].nOut;
2981 pNew->prereq = sSum.a[i].prereq;
drhfd5874d2013-06-12 14:52:39 +00002982 rc = whereLoopInsert(pBuilder, pNew);
2983 }
drh0a99ba32014-09-30 17:03:35 +00002984 WHERETRACE(0x200, ("End processing OR-clause %p\n", pTerm));
drhcf8fa7a2013-05-10 20:26:22 +00002985 }
2986 }
2987 return rc;
2988}
2989
2990/*
drhf1b5f5b2013-05-02 00:15:01 +00002991** Add all WhereLoop objects for all tables
2992*/
drh5346e952013-05-08 14:14:26 +00002993static int whereLoopAddAll(WhereLoopBuilder *pBuilder){
drh70d18342013-06-06 19:16:33 +00002994 WhereInfo *pWInfo = pBuilder->pWInfo;
drhf1b5f5b2013-05-02 00:15:01 +00002995 Bitmask mExtra = 0;
2996 Bitmask mPrior = 0;
2997 int iTab;
drh70d18342013-06-06 19:16:33 +00002998 SrcList *pTabList = pWInfo->pTabList;
drhf1b5f5b2013-05-02 00:15:01 +00002999 struct SrcList_item *pItem;
dan4f20cd42015-06-08 18:05:54 +00003000 struct SrcList_item *pEnd = &pTabList->a[pWInfo->nLevel];
drh70d18342013-06-06 19:16:33 +00003001 sqlite3 *db = pWInfo->pParse->db;
drh5346e952013-05-08 14:14:26 +00003002 int rc = SQLITE_OK;
drhb8a8e8a2013-06-10 19:12:39 +00003003 WhereLoop *pNew;
dan35175bf2015-06-08 18:48:29 +00003004 u8 priorJointype = 0;
drhf1b5f5b2013-05-02 00:15:01 +00003005
3006 /* Loop over the tables in the join, from left to right */
drhb8a8e8a2013-06-10 19:12:39 +00003007 pNew = pBuilder->pNew;
drha2014152013-06-07 00:29:23 +00003008 whereLoopInit(pNew);
dan4f20cd42015-06-08 18:05:54 +00003009 for(iTab=0, pItem=pTabList->a; pItem<pEnd; iTab++, pItem++){
3010 Bitmask mUnusable = 0;
drhb2a90f02013-05-10 03:30:49 +00003011 pNew->iTab = iTab;
drh6f82e852015-06-06 20:12:09 +00003012 pNew->maskSelf = sqlite3WhereGetMask(&pWInfo->sMaskSet, pItem->iCursor);
drh8a48b9c2015-08-19 15:20:00 +00003013 if( ((pItem->fg.jointype|priorJointype) & (JT_LEFT|JT_CROSS))!=0 ){
dan4f20cd42015-06-08 18:05:54 +00003014 /* This condition is true when pItem is the FROM clause term on the
3015 ** right-hand-side of a LEFT or CROSS JOIN. */
drhf1b5f5b2013-05-02 00:15:01 +00003016 mExtra = mPrior;
3017 }
drh8a48b9c2015-08-19 15:20:00 +00003018 priorJointype = pItem->fg.jointype;
drhb2a90f02013-05-10 03:30:49 +00003019 if( IsVirtual(pItem->pTab) ){
dan4f20cd42015-06-08 18:05:54 +00003020 struct SrcList_item *p;
3021 for(p=&pItem[1]; p<pEnd; p++){
drh8a48b9c2015-08-19 15:20:00 +00003022 if( mUnusable || (p->fg.jointype & (JT_LEFT|JT_CROSS)) ){
dan4f20cd42015-06-08 18:05:54 +00003023 mUnusable |= sqlite3WhereGetMask(&pWInfo->sMaskSet, p->iCursor);
3024 }
3025 }
3026 rc = whereLoopAddVirtual(pBuilder, mExtra, mUnusable);
drhb2a90f02013-05-10 03:30:49 +00003027 }else{
3028 rc = whereLoopAddBtree(pBuilder, mExtra);
3029 }
drhb2a90f02013-05-10 03:30:49 +00003030 if( rc==SQLITE_OK ){
dan4f20cd42015-06-08 18:05:54 +00003031 rc = whereLoopAddOr(pBuilder, mExtra, mUnusable);
drhb2a90f02013-05-10 03:30:49 +00003032 }
drhb2a90f02013-05-10 03:30:49 +00003033 mPrior |= pNew->maskSelf;
drh5346e952013-05-08 14:14:26 +00003034 if( rc || db->mallocFailed ) break;
drhf1b5f5b2013-05-02 00:15:01 +00003035 }
dan4f20cd42015-06-08 18:05:54 +00003036
drha2014152013-06-07 00:29:23 +00003037 whereLoopClear(db, pNew);
drh5346e952013-05-08 14:14:26 +00003038 return rc;
drhf1b5f5b2013-05-02 00:15:01 +00003039}
3040
drha18f3d22013-05-08 03:05:41 +00003041/*
drh7699d1c2013-06-04 12:42:29 +00003042** Examine a WherePath (with the addition of the extra WhereLoop of the 5th
drh319f6772013-05-14 15:31:07 +00003043** parameters) to see if it outputs rows in the requested ORDER BY
drh0401ace2014-03-18 15:30:27 +00003044** (or GROUP BY) without requiring a separate sort operation. Return N:
drh319f6772013-05-14 15:31:07 +00003045**
drh0401ace2014-03-18 15:30:27 +00003046** N>0: N terms of the ORDER BY clause are satisfied
3047** N==0: No terms of the ORDER BY clause are satisfied
3048** N<0: Unknown yet how many terms of ORDER BY might be satisfied.
drh319f6772013-05-14 15:31:07 +00003049**
drh94433422013-07-01 11:05:50 +00003050** Note that processing for WHERE_GROUPBY and WHERE_DISTINCTBY is not as
3051** strict. With GROUP BY and DISTINCT the only requirement is that
3052** equivalent rows appear immediately adjacent to one another. GROUP BY
dan374cd782014-04-21 13:21:56 +00003053** and DISTINCT do not require rows to appear in any particular order as long
peter.d.reid60ec9142014-09-06 16:39:46 +00003054** as equivalent rows are grouped together. Thus for GROUP BY and DISTINCT
drh94433422013-07-01 11:05:50 +00003055** the pOrderBy terms can be matched in any order. With ORDER BY, the
3056** pOrderBy terms must be matched in strict left-to-right order.
drh6b7157b2013-05-10 02:00:35 +00003057*/
drh0401ace2014-03-18 15:30:27 +00003058static i8 wherePathSatisfiesOrderBy(
drh6b7157b2013-05-10 02:00:35 +00003059 WhereInfo *pWInfo, /* The WHERE clause */
drh4f402f22013-06-11 18:59:38 +00003060 ExprList *pOrderBy, /* ORDER BY or GROUP BY or DISTINCT clause to check */
drh6b7157b2013-05-10 02:00:35 +00003061 WherePath *pPath, /* The WherePath to check */
drh4f402f22013-06-11 18:59:38 +00003062 u16 wctrlFlags, /* Might contain WHERE_GROUPBY or WHERE_DISTINCTBY */
3063 u16 nLoop, /* Number of entries in pPath->aLoop[] */
drh319f6772013-05-14 15:31:07 +00003064 WhereLoop *pLast, /* Add this WhereLoop to the end of pPath->aLoop[] */
drh4f402f22013-06-11 18:59:38 +00003065 Bitmask *pRevMask /* OUT: Mask of WhereLoops to run in reverse order */
drh6b7157b2013-05-10 02:00:35 +00003066){
drh88da6442013-05-27 17:59:37 +00003067 u8 revSet; /* True if rev is known */
3068 u8 rev; /* Composite sort order */
3069 u8 revIdx; /* Index sort order */
drhe353ee32013-06-04 23:40:53 +00003070 u8 isOrderDistinct; /* All prior WhereLoops are order-distinct */
3071 u8 distinctColumns; /* True if the loop has UNIQUE NOT NULL columns */
3072 u8 isMatch; /* iColumn matches a term of the ORDER BY clause */
drh416846a2013-11-06 12:56:04 +00003073 u16 nKeyCol; /* Number of key columns in pIndex */
3074 u16 nColumn; /* Total number of ordered columns in the index */
drh7699d1c2013-06-04 12:42:29 +00003075 u16 nOrderBy; /* Number terms in the ORDER BY clause */
3076 int iLoop; /* Index of WhereLoop in pPath being processed */
3077 int i, j; /* Loop counters */
3078 int iCur; /* Cursor number for current WhereLoop */
3079 int iColumn; /* A column number within table iCur */
drhe8ae5832013-06-19 13:32:46 +00003080 WhereLoop *pLoop = 0; /* Current WhereLoop being processed. */
drh7699d1c2013-06-04 12:42:29 +00003081 WhereTerm *pTerm; /* A single term of the WHERE clause */
3082 Expr *pOBExpr; /* An expression from the ORDER BY clause */
3083 CollSeq *pColl; /* COLLATE function from an ORDER BY clause term */
3084 Index *pIndex; /* The index associated with pLoop */
3085 sqlite3 *db = pWInfo->pParse->db; /* Database connection */
3086 Bitmask obSat = 0; /* Mask of ORDER BY terms satisfied so far */
3087 Bitmask obDone; /* Mask of all ORDER BY terms */
drhe353ee32013-06-04 23:40:53 +00003088 Bitmask orderDistinctMask; /* Mask of all well-ordered loops */
drhb8916be2013-06-14 02:51:48 +00003089 Bitmask ready; /* Mask of inner loops */
drh319f6772013-05-14 15:31:07 +00003090
3091 /*
drh7699d1c2013-06-04 12:42:29 +00003092 ** We say the WhereLoop is "one-row" if it generates no more than one
3093 ** row of output. A WhereLoop is one-row if all of the following are true:
drh319f6772013-05-14 15:31:07 +00003094 ** (a) All index columns match with WHERE_COLUMN_EQ.
3095 ** (b) The index is unique
drh7699d1c2013-06-04 12:42:29 +00003096 ** Any WhereLoop with an WHERE_COLUMN_EQ constraint on the rowid is one-row.
3097 ** Every one-row WhereLoop will have the WHERE_ONEROW bit set in wsFlags.
drh319f6772013-05-14 15:31:07 +00003098 **
drhe353ee32013-06-04 23:40:53 +00003099 ** We say the WhereLoop is "order-distinct" if the set of columns from
3100 ** that WhereLoop that are in the ORDER BY clause are different for every
3101 ** row of the WhereLoop. Every one-row WhereLoop is automatically
3102 ** order-distinct. A WhereLoop that has no columns in the ORDER BY clause
3103 ** is not order-distinct. To be order-distinct is not quite the same as being
3104 ** UNIQUE since a UNIQUE column or index can have multiple rows that
3105 ** are NULL and NULL values are equivalent for the purpose of order-distinct.
3106 ** To be order-distinct, the columns must be UNIQUE and NOT NULL.
3107 **
3108 ** The rowid for a table is always UNIQUE and NOT NULL so whenever the
3109 ** rowid appears in the ORDER BY clause, the corresponding WhereLoop is
3110 ** automatically order-distinct.
drh319f6772013-05-14 15:31:07 +00003111 */
3112
3113 assert( pOrderBy!=0 );
drh7699d1c2013-06-04 12:42:29 +00003114 if( nLoop && OptimizationDisabled(db, SQLITE_OrderByIdxJoin) ) return 0;
drh319f6772013-05-14 15:31:07 +00003115
drh319f6772013-05-14 15:31:07 +00003116 nOrderBy = pOrderBy->nExpr;
drh7963b0e2013-06-17 21:37:40 +00003117 testcase( nOrderBy==BMS-1 );
drhe353ee32013-06-04 23:40:53 +00003118 if( nOrderBy>BMS-1 ) return 0; /* Cannot optimize overly large ORDER BYs */
3119 isOrderDistinct = 1;
drh7699d1c2013-06-04 12:42:29 +00003120 obDone = MASKBIT(nOrderBy)-1;
drhe353ee32013-06-04 23:40:53 +00003121 orderDistinctMask = 0;
drhb8916be2013-06-14 02:51:48 +00003122 ready = 0;
drhe353ee32013-06-04 23:40:53 +00003123 for(iLoop=0; isOrderDistinct && obSat<obDone && iLoop<=nLoop; iLoop++){
drhb8916be2013-06-14 02:51:48 +00003124 if( iLoop>0 ) ready |= pLoop->maskSelf;
drh7699d1c2013-06-04 12:42:29 +00003125 pLoop = iLoop<nLoop ? pPath->aLoop[iLoop] : pLast;
drh9dfaf622014-04-25 14:42:17 +00003126 if( pLoop->wsFlags & WHERE_VIRTUALTABLE ){
3127 if( pLoop->u.vtab.isOrdered ) obSat = obDone;
3128 break;
3129 }
drh319f6772013-05-14 15:31:07 +00003130 iCur = pWInfo->pTabList->a[pLoop->iTab].iCursor;
drhb8916be2013-06-14 02:51:48 +00003131
3132 /* Mark off any ORDER BY term X that is a column in the table of
3133 ** the current loop for which there is term in the WHERE
3134 ** clause of the form X IS NULL or X=? that reference only outer
3135 ** loops.
3136 */
3137 for(i=0; i<nOrderBy; i++){
3138 if( MASKBIT(i) & obSat ) continue;
3139 pOBExpr = sqlite3ExprSkipCollate(pOrderBy->a[i].pExpr);
3140 if( pOBExpr->op!=TK_COLUMN ) continue;
3141 if( pOBExpr->iTable!=iCur ) continue;
drh6f82e852015-06-06 20:12:09 +00003142 pTerm = sqlite3WhereFindTerm(&pWInfo->sWC, iCur, pOBExpr->iColumn,
drhe8d0c612015-05-14 01:05:25 +00003143 ~ready, WO_EQ|WO_ISNULL|WO_IS, 0);
drhb8916be2013-06-14 02:51:48 +00003144 if( pTerm==0 ) continue;
drhe8d0c612015-05-14 01:05:25 +00003145 if( (pTerm->eOperator&(WO_EQ|WO_IS))!=0 && pOBExpr->iColumn>=0 ){
drhb8916be2013-06-14 02:51:48 +00003146 const char *z1, *z2;
3147 pColl = sqlite3ExprCollSeq(pWInfo->pParse, pOrderBy->a[i].pExpr);
3148 if( !pColl ) pColl = db->pDfltColl;
3149 z1 = pColl->zName;
3150 pColl = sqlite3ExprCollSeq(pWInfo->pParse, pTerm->pExpr);
3151 if( !pColl ) pColl = db->pDfltColl;
3152 z2 = pColl->zName;
3153 if( sqlite3StrICmp(z1, z2)!=0 ) continue;
drhe0cc3c22015-05-13 17:54:08 +00003154 testcase( pTerm->pExpr->op==TK_IS );
drhb8916be2013-06-14 02:51:48 +00003155 }
3156 obSat |= MASKBIT(i);
3157 }
3158
drh7699d1c2013-06-04 12:42:29 +00003159 if( (pLoop->wsFlags & WHERE_ONEROW)==0 ){
3160 if( pLoop->wsFlags & WHERE_IPK ){
3161 pIndex = 0;
drhbbbdc832013-10-22 18:01:40 +00003162 nKeyCol = 0;
drh416846a2013-11-06 12:56:04 +00003163 nColumn = 1;
drh7699d1c2013-06-04 12:42:29 +00003164 }else if( (pIndex = pLoop->u.btree.pIndex)==0 || pIndex->bUnordered ){
drh1b0f0262013-05-30 22:27:09 +00003165 return 0;
drh7699d1c2013-06-04 12:42:29 +00003166 }else{
drhbbbdc832013-10-22 18:01:40 +00003167 nKeyCol = pIndex->nKeyCol;
drh416846a2013-11-06 12:56:04 +00003168 nColumn = pIndex->nColumn;
3169 assert( nColumn==nKeyCol+1 || !HasRowid(pIndex->pTable) );
3170 assert( pIndex->aiColumn[nColumn-1]==(-1) || !HasRowid(pIndex->pTable));
drh5f1d1d92014-07-31 22:59:04 +00003171 isOrderDistinct = IsUniqueIndex(pIndex);
drh1b0f0262013-05-30 22:27:09 +00003172 }
drh7699d1c2013-06-04 12:42:29 +00003173
drh7699d1c2013-06-04 12:42:29 +00003174 /* Loop through all columns of the index and deal with the ones
3175 ** that are not constrained by == or IN.
3176 */
3177 rev = revSet = 0;
drhe353ee32013-06-04 23:40:53 +00003178 distinctColumns = 0;
drh416846a2013-11-06 12:56:04 +00003179 for(j=0; j<nColumn; j++){
drh7699d1c2013-06-04 12:42:29 +00003180 u8 bOnce; /* True to run the ORDER BY search loop */
3181
drhe353ee32013-06-04 23:40:53 +00003182 /* Skip over == and IS NULL terms */
drh7699d1c2013-06-04 12:42:29 +00003183 if( j<pLoop->u.btree.nEq
drhc8bbce12014-10-21 01:05:09 +00003184 && pLoop->nSkip==0
drhe8d0c612015-05-14 01:05:25 +00003185 && ((i = pLoop->aLTerm[j]->eOperator) & (WO_EQ|WO_ISNULL|WO_IS))!=0
drh7699d1c2013-06-04 12:42:29 +00003186 ){
drh7963b0e2013-06-17 21:37:40 +00003187 if( i & WO_ISNULL ){
3188 testcase( isOrderDistinct );
3189 isOrderDistinct = 0;
3190 }
drhe353ee32013-06-04 23:40:53 +00003191 continue;
drh7699d1c2013-06-04 12:42:29 +00003192 }
3193
drhe353ee32013-06-04 23:40:53 +00003194 /* Get the column number in the table (iColumn) and sort order
3195 ** (revIdx) for the j-th column of the index.
drh7699d1c2013-06-04 12:42:29 +00003196 */
drh416846a2013-11-06 12:56:04 +00003197 if( pIndex ){
drh7699d1c2013-06-04 12:42:29 +00003198 iColumn = pIndex->aiColumn[j];
3199 revIdx = pIndex->aSortOrder[j];
3200 if( iColumn==pIndex->pTable->iPKey ) iColumn = -1;
drhdc3cd4b2013-05-30 23:21:20 +00003201 }else{
drh7699d1c2013-06-04 12:42:29 +00003202 iColumn = -1;
3203 revIdx = 0;
drhdc3cd4b2013-05-30 23:21:20 +00003204 }
drh7699d1c2013-06-04 12:42:29 +00003205
3206 /* An unconstrained column that might be NULL means that this
drh416846a2013-11-06 12:56:04 +00003207 ** WhereLoop is not well-ordered
drh7699d1c2013-06-04 12:42:29 +00003208 */
drhe353ee32013-06-04 23:40:53 +00003209 if( isOrderDistinct
3210 && iColumn>=0
drh7699d1c2013-06-04 12:42:29 +00003211 && j>=pLoop->u.btree.nEq
3212 && pIndex->pTable->aCol[iColumn].notNull==0
3213 ){
drhe353ee32013-06-04 23:40:53 +00003214 isOrderDistinct = 0;
drh7699d1c2013-06-04 12:42:29 +00003215 }
3216
3217 /* Find the ORDER BY term that corresponds to the j-th column
dan374cd782014-04-21 13:21:56 +00003218 ** of the index and mark that ORDER BY term off
drh7699d1c2013-06-04 12:42:29 +00003219 */
3220 bOnce = 1;
drhe353ee32013-06-04 23:40:53 +00003221 isMatch = 0;
drh7699d1c2013-06-04 12:42:29 +00003222 for(i=0; bOnce && i<nOrderBy; i++){
3223 if( MASKBIT(i) & obSat ) continue;
3224 pOBExpr = sqlite3ExprSkipCollate(pOrderBy->a[i].pExpr);
drh93ec45d2013-06-17 18:20:48 +00003225 testcase( wctrlFlags & WHERE_GROUPBY );
3226 testcase( wctrlFlags & WHERE_DISTINCTBY );
drh4f402f22013-06-11 18:59:38 +00003227 if( (wctrlFlags & (WHERE_GROUPBY|WHERE_DISTINCTBY))==0 ) bOnce = 0;
drhe353ee32013-06-04 23:40:53 +00003228 if( pOBExpr->op!=TK_COLUMN ) continue;
drh7699d1c2013-06-04 12:42:29 +00003229 if( pOBExpr->iTable!=iCur ) continue;
3230 if( pOBExpr->iColumn!=iColumn ) continue;
3231 if( iColumn>=0 ){
3232 pColl = sqlite3ExprCollSeq(pWInfo->pParse, pOrderBy->a[i].pExpr);
3233 if( !pColl ) pColl = db->pDfltColl;
3234 if( sqlite3StrICmp(pColl->zName, pIndex->azColl[j])!=0 ) continue;
3235 }
drhe353ee32013-06-04 23:40:53 +00003236 isMatch = 1;
drh7699d1c2013-06-04 12:42:29 +00003237 break;
3238 }
drh49290472014-10-11 02:12:58 +00003239 if( isMatch && (wctrlFlags & WHERE_GROUPBY)==0 ){
drh59b8f2e2014-03-22 00:27:14 +00003240 /* Make sure the sort order is compatible in an ORDER BY clause.
3241 ** Sort order is irrelevant for a GROUP BY clause. */
3242 if( revSet ){
3243 if( (rev ^ revIdx)!=pOrderBy->a[i].sortOrder ) isMatch = 0;
3244 }else{
3245 rev = revIdx ^ pOrderBy->a[i].sortOrder;
3246 if( rev ) *pRevMask |= MASKBIT(iLoop);
3247 revSet = 1;
3248 }
3249 }
drhe353ee32013-06-04 23:40:53 +00003250 if( isMatch ){
drh7963b0e2013-06-17 21:37:40 +00003251 if( iColumn<0 ){
3252 testcase( distinctColumns==0 );
3253 distinctColumns = 1;
3254 }
drh7699d1c2013-06-04 12:42:29 +00003255 obSat |= MASKBIT(i);
drh7699d1c2013-06-04 12:42:29 +00003256 }else{
3257 /* No match found */
drhbbbdc832013-10-22 18:01:40 +00003258 if( j==0 || j<nKeyCol ){
drh7963b0e2013-06-17 21:37:40 +00003259 testcase( isOrderDistinct!=0 );
3260 isOrderDistinct = 0;
3261 }
drh7699d1c2013-06-04 12:42:29 +00003262 break;
3263 }
3264 } /* end Loop over all index columns */
drh81186b42013-06-18 01:52:41 +00003265 if( distinctColumns ){
3266 testcase( isOrderDistinct==0 );
3267 isOrderDistinct = 1;
3268 }
drh7699d1c2013-06-04 12:42:29 +00003269 } /* end-if not one-row */
3270
3271 /* Mark off any other ORDER BY terms that reference pLoop */
drhe353ee32013-06-04 23:40:53 +00003272 if( isOrderDistinct ){
3273 orderDistinctMask |= pLoop->maskSelf;
drh7699d1c2013-06-04 12:42:29 +00003274 for(i=0; i<nOrderBy; i++){
3275 Expr *p;
drh434a9312014-02-26 02:26:09 +00003276 Bitmask mTerm;
drh7699d1c2013-06-04 12:42:29 +00003277 if( MASKBIT(i) & obSat ) continue;
3278 p = pOrderBy->a[i].pExpr;
drh6c1f4ef2015-06-08 14:23:15 +00003279 mTerm = sqlite3WhereExprUsage(&pWInfo->sMaskSet,p);
drh434a9312014-02-26 02:26:09 +00003280 if( mTerm==0 && !sqlite3ExprIsConstant(p) ) continue;
3281 if( (mTerm&~orderDistinctMask)==0 ){
drh7699d1c2013-06-04 12:42:29 +00003282 obSat |= MASKBIT(i);
3283 }
drh0afb4232013-05-31 13:36:32 +00003284 }
drh319f6772013-05-14 15:31:07 +00003285 }
drhb8916be2013-06-14 02:51:48 +00003286 } /* End the loop over all WhereLoops from outer-most down to inner-most */
drh36ed0342014-03-28 12:56:57 +00003287 if( obSat==obDone ) return (i8)nOrderBy;
drhd2de8612014-03-18 18:59:07 +00003288 if( !isOrderDistinct ){
3289 for(i=nOrderBy-1; i>0; i--){
3290 Bitmask m = MASKBIT(i) - 1;
3291 if( (obSat&m)==m ) return i;
3292 }
3293 return 0;
3294 }
drh319f6772013-05-14 15:31:07 +00003295 return -1;
drh6b7157b2013-05-10 02:00:35 +00003296}
3297
dan374cd782014-04-21 13:21:56 +00003298
3299/*
3300** If the WHERE_GROUPBY flag is set in the mask passed to sqlite3WhereBegin(),
3301** the planner assumes that the specified pOrderBy list is actually a GROUP
3302** BY clause - and so any order that groups rows as required satisfies the
3303** request.
3304**
3305** Normally, in this case it is not possible for the caller to determine
3306** whether or not the rows are really being delivered in sorted order, or
3307** just in some other order that provides the required grouping. However,
3308** if the WHERE_SORTBYGROUP flag is also passed to sqlite3WhereBegin(), then
3309** this function may be called on the returned WhereInfo object. It returns
3310** true if the rows really will be sorted in the specified order, or false
3311** otherwise.
3312**
3313** For example, assuming:
3314**
3315** CREATE INDEX i1 ON t1(x, Y);
3316**
3317** then
3318**
3319** SELECT * FROM t1 GROUP BY x,y ORDER BY x,y; -- IsSorted()==1
3320** SELECT * FROM t1 GROUP BY y,x ORDER BY y,x; -- IsSorted()==0
3321*/
3322int sqlite3WhereIsSorted(WhereInfo *pWInfo){
3323 assert( pWInfo->wctrlFlags & WHERE_GROUPBY );
3324 assert( pWInfo->wctrlFlags & WHERE_SORTBYGROUP );
3325 return pWInfo->sorted;
3326}
3327
#ifdef WHERETRACE_ENABLED
/*
** For debugging use only.
**
** Build a printable name for a path: the cId of each of the first nLoop
** entries of pPath->aLoop[], followed by the cId of pLast if pLast is not
** NULL.  The result is a zero-terminated string.
**
** The string lives in a static buffer, so it is overwritten by the next
** call and the routine is not reentrant.  The buffer holds at most 64
** identifiers plus the terminator; no bounds check is performed.
*/
static const char *wherePathName(WherePath *pPath, int nLoop, WhereLoop *pLast){
  static char zName[65];
  char *zOut = zName;      /* Next byte of zName[] to be written */
  int k = 0;               /* Index into pPath->aLoop[] */

  while( k<nLoop ){
    *zOut++ = pPath->aLoop[k]->cId;
    k++;
  }
  if( pLast!=0 ){
    *zOut++ = pLast->cId;
  }
  *zOut = 0;
  return zName;
}
#endif
3339
drh6b7157b2013-05-10 02:00:35 +00003340/*
dan50ae31e2014-08-08 16:52:28 +00003341** Return the cost of sorting nRow rows, assuming that the keys have
3342** nOrderby columns and that the first nSorted columns are already in
3343** order.
3344*/
3345static LogEst whereSortingCost(
3346 WhereInfo *pWInfo,
3347 LogEst nRow,
3348 int nOrderBy,
3349 int nSorted
3350){
3351 /* TUNING: Estimated cost of a full external sort, where N is
3352 ** the number of rows to sort is:
3353 **
3354 ** cost = (3.0 * N * log(N)).
3355 **
3356 ** Or, if the order-by clause has X terms but only the last Y
3357 ** terms are out of order, then block-sorting will reduce the
3358 ** sorting cost to:
3359 **
3360 ** cost = (3.0 * N * log(N)) * (Y/X)
3361 **
3362 ** The (Y/X) term is implemented using stack variable rScale
3363 ** below. */
3364 LogEst rScale, rSortCost;
3365 assert( nOrderBy>0 && 66==sqlite3LogEst(100) );
3366 rScale = sqlite3LogEst((nOrderBy-nSorted)*100/nOrderBy) - 66;
3367 rSortCost = nRow + estLog(nRow) + rScale + 16;
3368
3369 /* TUNING: The cost of implementing DISTINCT using a B-TREE is
3370 ** similar but with a larger constant of proportionality.
3371 ** Multiply by an additional factor of 3.0. */
3372 if( pWInfo->wctrlFlags & WHERE_WANT_DISTINCT ){
3373 rSortCost += 16;
3374 }
3375
3376 return rSortCost;
3377}
3378
3379/*
dan51576f42013-07-02 10:06:15 +00003380** Given the list of WhereLoop objects at pWInfo->pLoops, this routine
drha18f3d22013-05-08 03:05:41 +00003381** attempts to find the lowest cost path that visits each WhereLoop
3382** once. This path is then loaded into the pWInfo->a[].pWLoop fields.
3383**
drhc7f0d222013-06-19 03:27:12 +00003384** Assume that the total number of output rows that will need to be sorted
3385** will be nRowEst (in the 10*log2 representation). Or, ignore sorting
3386** costs if nRowEst==0.
3387**
drha18f3d22013-05-08 03:05:41 +00003388** Return SQLITE_OK on success or SQLITE_NOMEM of a memory allocation
3389** error occurs.
3390*/
drhbf539c42013-10-05 18:16:02 +00003391static int wherePathSolver(WhereInfo *pWInfo, LogEst nRowEst){
drh783dece2013-06-05 17:53:43 +00003392 int mxChoice; /* Maximum number of simultaneous paths tracked */
drha18f3d22013-05-08 03:05:41 +00003393 int nLoop; /* Number of terms in the join */
drhe1e2e9a2013-06-13 15:16:53 +00003394 Parse *pParse; /* Parsing context */
drha18f3d22013-05-08 03:05:41 +00003395 sqlite3 *db; /* The database connection */
3396 int iLoop; /* Loop counter over the terms of the join */
3397 int ii, jj; /* Loop counters */
drhfde1e6b2013-09-06 17:45:42 +00003398 int mxI = 0; /* Index of next entry to replace */
drhd2de8612014-03-18 18:59:07 +00003399 int nOrderBy; /* Number of ORDER BY clause terms */
drhbf539c42013-10-05 18:16:02 +00003400 LogEst mxCost = 0; /* Maximum cost of a set of paths */
dan50ae31e2014-08-08 16:52:28 +00003401 LogEst mxUnsorted = 0; /* Maximum unsorted cost of a set of path */
drha18f3d22013-05-08 03:05:41 +00003402 int nTo, nFrom; /* Number of valid entries in aTo[] and aFrom[] */
3403 WherePath *aFrom; /* All nFrom paths at the previous level */
3404 WherePath *aTo; /* The nTo best paths at the current level */
3405 WherePath *pFrom; /* An element of aFrom[] that we are working on */
3406 WherePath *pTo; /* An element of aTo[] that we are working on */
3407 WhereLoop *pWLoop; /* One of the WhereLoop objects */
3408 WhereLoop **pX; /* Used to divy up the pSpace memory */
dan50ae31e2014-08-08 16:52:28 +00003409 LogEst *aSortCost = 0; /* Sorting and partial sorting costs */
drha18f3d22013-05-08 03:05:41 +00003410 char *pSpace; /* Temporary memory used by this routine */
dane2c27852014-08-08 17:25:33 +00003411 int nSpace; /* Bytes of space allocated at pSpace */
drha18f3d22013-05-08 03:05:41 +00003412
drhe1e2e9a2013-06-13 15:16:53 +00003413 pParse = pWInfo->pParse;
3414 db = pParse->db;
drha18f3d22013-05-08 03:05:41 +00003415 nLoop = pWInfo->nLevel;
drhe1e2e9a2013-06-13 15:16:53 +00003416 /* TUNING: For simple queries, only the best path is tracked.
3417 ** For 2-way joins, the 5 best paths are followed.
3418 ** For joins of 3 or more tables, track the 10 best paths */
drh2504c6c2014-06-02 11:26:33 +00003419 mxChoice = (nLoop<=1) ? 1 : (nLoop==2 ? 5 : 10);
drha18f3d22013-05-08 03:05:41 +00003420 assert( nLoop<=pWInfo->pTabList->nSrc );
drhddef5dc2014-08-07 16:50:00 +00003421 WHERETRACE(0x002, ("---- begin solver. (nRowEst=%d)\n", nRowEst));
drha18f3d22013-05-08 03:05:41 +00003422
dan50ae31e2014-08-08 16:52:28 +00003423 /* If nRowEst is zero and there is an ORDER BY clause, ignore it. In this
3424 ** case the purpose of this call is to estimate the number of rows returned
3425 ** by the overall query. Once this estimate has been obtained, the caller
3426 ** will invoke this function a second time, passing the estimate as the
3427 ** nRowEst parameter. */
3428 if( pWInfo->pOrderBy==0 || nRowEst==0 ){
3429 nOrderBy = 0;
3430 }else{
3431 nOrderBy = pWInfo->pOrderBy->nExpr;
3432 }
3433
3434 /* Allocate and initialize space for aTo, aFrom and aSortCost[] */
dane2c27852014-08-08 17:25:33 +00003435 nSpace = (sizeof(WherePath)+sizeof(WhereLoop*)*nLoop)*mxChoice*2;
3436 nSpace += sizeof(LogEst) * nOrderBy;
3437 pSpace = sqlite3DbMallocRaw(db, nSpace);
drha18f3d22013-05-08 03:05:41 +00003438 if( pSpace==0 ) return SQLITE_NOMEM;
3439 aTo = (WherePath*)pSpace;
3440 aFrom = aTo+mxChoice;
3441 memset(aFrom, 0, sizeof(aFrom[0]));
3442 pX = (WhereLoop**)(aFrom+mxChoice);
drhe9d935a2013-06-05 16:19:59 +00003443 for(ii=mxChoice*2, pFrom=aTo; ii>0; ii--, pFrom++, pX += nLoop){
drha18f3d22013-05-08 03:05:41 +00003444 pFrom->aLoop = pX;
3445 }
dan50ae31e2014-08-08 16:52:28 +00003446 if( nOrderBy ){
3447 /* If there is an ORDER BY clause and it is not being ignored, set up
3448 ** space for the aSortCost[] array. Each element of the aSortCost array
3449 ** is either zero - meaning it has not yet been initialized - or the
3450 ** cost of sorting nRowEst rows of data where the first X terms of
3451 ** the ORDER BY clause are already in order, where X is the array
3452 ** index. */
3453 aSortCost = (LogEst*)pX;
dane2c27852014-08-08 17:25:33 +00003454 memset(aSortCost, 0, sizeof(LogEst) * nOrderBy);
dan50ae31e2014-08-08 16:52:28 +00003455 }
dane2c27852014-08-08 17:25:33 +00003456 assert( aSortCost==0 || &pSpace[nSpace]==(char*)&aSortCost[nOrderBy] );
3457 assert( aSortCost!=0 || &pSpace[nSpace]==(char*)pX );
drha18f3d22013-05-08 03:05:41 +00003458
drhe1e2e9a2013-06-13 15:16:53 +00003459 /* Seed the search with a single WherePath containing zero WhereLoops.
3460 **
danf104abb2015-03-16 20:40:00 +00003461 ** TUNING: Do not let the number of iterations go above 28. If the cost
3462 ** of computing an automatic index is not paid back within the first 28
drhe1e2e9a2013-06-13 15:16:53 +00003463 ** rows, then do not use the automatic index. */
danf104abb2015-03-16 20:40:00 +00003464 aFrom[0].nRow = MIN(pParse->nQueryLoop, 48); assert( 48==sqlite3LogEst(28) );
drha18f3d22013-05-08 03:05:41 +00003465 nFrom = 1;
dan50ae31e2014-08-08 16:52:28 +00003466 assert( aFrom[0].isOrdered==0 );
3467 if( nOrderBy ){
3468 /* If nLoop is zero, then there are no FROM terms in the query. Since
3469 ** in this case the query may return a maximum of one row, the results
3470 ** are already in the requested order. Set isOrdered to nOrderBy to
3471 ** indicate this. Or, if nLoop is greater than zero, set isOrdered to
3472 ** -1, indicating that the result set may or may not be ordered,
3473 ** depending on the loops added to the current plan. */
3474 aFrom[0].isOrdered = nLoop>0 ? -1 : nOrderBy;
drh6b7157b2013-05-10 02:00:35 +00003475 }
3476
3477 /* Compute successively longer WherePaths using the previous generation
3478 ** of WherePaths as the basis for the next. Keep track of the mxChoice
3479 ** best paths at each generation */
drha18f3d22013-05-08 03:05:41 +00003480 for(iLoop=0; iLoop<nLoop; iLoop++){
3481 nTo = 0;
3482 for(ii=0, pFrom=aFrom; ii<nFrom; ii++, pFrom++){
3483 for(pWLoop=pWInfo->pLoops; pWLoop; pWLoop=pWLoop->pNextLoop){
dan50ae31e2014-08-08 16:52:28 +00003484 LogEst nOut; /* Rows visited by (pFrom+pWLoop) */
3485 LogEst rCost; /* Cost of path (pFrom+pWLoop) */
3486 LogEst rUnsorted; /* Unsorted cost of (pFrom+pWLoop) */
3487 i8 isOrdered = pFrom->isOrdered; /* isOrdered for (pFrom+pWLoop) */
3488 Bitmask maskNew; /* Mask of src visited by (..) */
3489 Bitmask revMask = 0; /* Mask of rev-order loops for (..) */
3490
drha18f3d22013-05-08 03:05:41 +00003491 if( (pWLoop->prereq & ~pFrom->maskLoop)!=0 ) continue;
3492 if( (pWLoop->maskSelf & pFrom->maskLoop)!=0 ) continue;
drh6b7157b2013-05-10 02:00:35 +00003493 /* At this point, pWLoop is a candidate to be the next loop.
3494 ** Compute its cost */
dan50ae31e2014-08-08 16:52:28 +00003495 rUnsorted = sqlite3LogEstAdd(pWLoop->rSetup,pWLoop->rRun + pFrom->nRow);
3496 rUnsorted = sqlite3LogEstAdd(rUnsorted, pFrom->rUnsorted);
drhfde1e6b2013-09-06 17:45:42 +00003497 nOut = pFrom->nRow + pWLoop->nOut;
drha18f3d22013-05-08 03:05:41 +00003498 maskNew = pFrom->maskLoop | pWLoop->maskSelf;
drh0401ace2014-03-18 15:30:27 +00003499 if( isOrdered<0 ){
3500 isOrdered = wherePathSatisfiesOrderBy(pWInfo,
drh4f402f22013-06-11 18:59:38 +00003501 pWInfo->pOrderBy, pFrom, pWInfo->wctrlFlags,
drh0401ace2014-03-18 15:30:27 +00003502 iLoop, pWLoop, &revMask);
drh3a5ba8b2013-06-03 15:34:48 +00003503 }else{
3504 revMask = pFrom->revLoop;
drh6b7157b2013-05-10 02:00:35 +00003505 }
dan50ae31e2014-08-08 16:52:28 +00003506 if( isOrdered>=0 && isOrdered<nOrderBy ){
3507 if( aSortCost[isOrdered]==0 ){
3508 aSortCost[isOrdered] = whereSortingCost(
3509 pWInfo, nRowEst, nOrderBy, isOrdered
3510 );
3511 }
3512 rCost = sqlite3LogEstAdd(rUnsorted, aSortCost[isOrdered]);
3513
3514 WHERETRACE(0x002,
3515 ("---- sort cost=%-3d (%d/%d) increases cost %3d to %-3d\n",
3516 aSortCost[isOrdered], (nOrderBy-isOrdered), nOrderBy,
3517 rUnsorted, rCost));
3518 }else{
3519 rCost = rUnsorted;
3520 }
3521
drhddef5dc2014-08-07 16:50:00 +00003522 /* Check to see if pWLoop should be added to the set of
3523 ** mxChoice best-so-far paths.
3524 **
3525 ** First look for an existing path among best-so-far paths
3526 ** that covers the same set of loops and has the same isOrdered
3527 ** setting as the current path candidate.
drhf2a90302014-08-07 20:37:01 +00003528 **
3529 ** The term "((pTo->isOrdered^isOrdered)&0x80)==0" is equivalent
3530 ** to (pTo->isOrdered==(-1))==(isOrdered==(-1))" for the range
3531 ** of legal values for isOrdered, -1..64.
drhddef5dc2014-08-07 16:50:00 +00003532 */
drh6b7157b2013-05-10 02:00:35 +00003533 for(jj=0, pTo=aTo; jj<nTo; jj++, pTo++){
drhfde1e6b2013-09-06 17:45:42 +00003534 if( pTo->maskLoop==maskNew
drhf2a90302014-08-07 20:37:01 +00003535 && ((pTo->isOrdered^isOrdered)&0x80)==0
drhfde1e6b2013-09-06 17:45:42 +00003536 ){
drh7963b0e2013-06-17 21:37:40 +00003537 testcase( jj==nTo-1 );
drh6b7157b2013-05-10 02:00:35 +00003538 break;
3539 }
3540 }
drha18f3d22013-05-08 03:05:41 +00003541 if( jj>=nTo ){
drhddef5dc2014-08-07 16:50:00 +00003542 /* None of the existing best-so-far paths match the candidate. */
drhddef5dc2014-08-07 16:50:00 +00003543 if( nTo>=mxChoice
dan50ae31e2014-08-08 16:52:28 +00003544 && (rCost>mxCost || (rCost==mxCost && rUnsorted>=mxUnsorted))
drhddef5dc2014-08-07 16:50:00 +00003545 ){
3546 /* The current candidate is no better than any of the mxChoice
3547 ** paths currently in the best-so-far buffer. So discard
3548 ** this candidate as not viable. */
drh989578e2013-10-28 14:34:35 +00003549#ifdef WHERETRACE_ENABLED /* 0x4 */
drhae70cf12013-05-31 15:18:46 +00003550 if( sqlite3WhereTrace&0x4 ){
drhfde1e6b2013-09-06 17:45:42 +00003551 sqlite3DebugPrintf("Skip %s cost=%-3d,%3d order=%c\n",
3552 wherePathName(pFrom, iLoop, pWLoop), rCost, nOut,
drh0401ace2014-03-18 15:30:27 +00003553 isOrdered>=0 ? isOrdered+'0' : '?');
drhd15cb172013-05-21 19:23:10 +00003554 }
3555#endif
3556 continue;
3557 }
drhddef5dc2014-08-07 16:50:00 +00003558 /* If we reach this points it means that the new candidate path
3559 ** needs to be added to the set of best-so-far paths. */
drha18f3d22013-05-08 03:05:41 +00003560 if( nTo<mxChoice ){
drhd15cb172013-05-21 19:23:10 +00003561 /* Increase the size of the aTo set by one */
drha18f3d22013-05-08 03:05:41 +00003562 jj = nTo++;
3563 }else{
drhd15cb172013-05-21 19:23:10 +00003564 /* New path replaces the prior worst to keep count below mxChoice */
drhfde1e6b2013-09-06 17:45:42 +00003565 jj = mxI;
drha18f3d22013-05-08 03:05:41 +00003566 }
3567 pTo = &aTo[jj];
drh989578e2013-10-28 14:34:35 +00003568#ifdef WHERETRACE_ENABLED /* 0x4 */
drhae70cf12013-05-31 15:18:46 +00003569 if( sqlite3WhereTrace&0x4 ){
drhfde1e6b2013-09-06 17:45:42 +00003570 sqlite3DebugPrintf("New %s cost=%-3d,%3d order=%c\n",
3571 wherePathName(pFrom, iLoop, pWLoop), rCost, nOut,
drh0401ace2014-03-18 15:30:27 +00003572 isOrdered>=0 ? isOrdered+'0' : '?');
drhd15cb172013-05-21 19:23:10 +00003573 }
3574#endif
drhf204dac2013-05-08 03:22:07 +00003575 }else{
drhddef5dc2014-08-07 16:50:00 +00003576 /* Control reaches here if best-so-far path pTo=aTo[jj] covers the
3577 ** same set of loops and has the sam isOrdered setting as the
3578 ** candidate path. Check to see if the candidate should replace
3579 ** pTo or if the candidate should be skipped */
3580 if( pTo->rCost<rCost || (pTo->rCost==rCost && pTo->nRow<=nOut) ){
drh989578e2013-10-28 14:34:35 +00003581#ifdef WHERETRACE_ENABLED /* 0x4 */
drhae70cf12013-05-31 15:18:46 +00003582 if( sqlite3WhereTrace&0x4 ){
drhd15cb172013-05-21 19:23:10 +00003583 sqlite3DebugPrintf(
drhfde1e6b2013-09-06 17:45:42 +00003584 "Skip %s cost=%-3d,%3d order=%c",
3585 wherePathName(pFrom, iLoop, pWLoop), rCost, nOut,
drh0401ace2014-03-18 15:30:27 +00003586 isOrdered>=0 ? isOrdered+'0' : '?');
drhfde1e6b2013-09-06 17:45:42 +00003587 sqlite3DebugPrintf(" vs %s cost=%-3d,%d order=%c\n",
3588 wherePathName(pTo, iLoop+1, 0), pTo->rCost, pTo->nRow,
drh0401ace2014-03-18 15:30:27 +00003589 pTo->isOrdered>=0 ? pTo->isOrdered+'0' : '?');
drhd15cb172013-05-21 19:23:10 +00003590 }
3591#endif
drhddef5dc2014-08-07 16:50:00 +00003592 /* Discard the candidate path from further consideration */
drh7963b0e2013-06-17 21:37:40 +00003593 testcase( pTo->rCost==rCost );
drhd15cb172013-05-21 19:23:10 +00003594 continue;
3595 }
drh7963b0e2013-06-17 21:37:40 +00003596 testcase( pTo->rCost==rCost+1 );
drhddef5dc2014-08-07 16:50:00 +00003597 /* Control reaches here if the candidate path is better than the
3598 ** pTo path. Replace pTo with the candidate. */
drh989578e2013-10-28 14:34:35 +00003599#ifdef WHERETRACE_ENABLED /* 0x4 */
drhae70cf12013-05-31 15:18:46 +00003600 if( sqlite3WhereTrace&0x4 ){
drhd15cb172013-05-21 19:23:10 +00003601 sqlite3DebugPrintf(
drhfde1e6b2013-09-06 17:45:42 +00003602 "Update %s cost=%-3d,%3d order=%c",
3603 wherePathName(pFrom, iLoop, pWLoop), rCost, nOut,
drh0401ace2014-03-18 15:30:27 +00003604 isOrdered>=0 ? isOrdered+'0' : '?');
drhfde1e6b2013-09-06 17:45:42 +00003605 sqlite3DebugPrintf(" was %s cost=%-3d,%3d order=%c\n",
3606 wherePathName(pTo, iLoop+1, 0), pTo->rCost, pTo->nRow,
drh0401ace2014-03-18 15:30:27 +00003607 pTo->isOrdered>=0 ? pTo->isOrdered+'0' : '?');
drhd15cb172013-05-21 19:23:10 +00003608 }
3609#endif
drha18f3d22013-05-08 03:05:41 +00003610 }
drh6b7157b2013-05-10 02:00:35 +00003611 /* pWLoop is a winner. Add it to the set of best so far */
drha18f3d22013-05-08 03:05:41 +00003612 pTo->maskLoop = pFrom->maskLoop | pWLoop->maskSelf;
drh319f6772013-05-14 15:31:07 +00003613 pTo->revLoop = revMask;
drhfde1e6b2013-09-06 17:45:42 +00003614 pTo->nRow = nOut;
drha18f3d22013-05-08 03:05:41 +00003615 pTo->rCost = rCost;
dan50ae31e2014-08-08 16:52:28 +00003616 pTo->rUnsorted = rUnsorted;
drh6b7157b2013-05-10 02:00:35 +00003617 pTo->isOrdered = isOrdered;
drha18f3d22013-05-08 03:05:41 +00003618 memcpy(pTo->aLoop, pFrom->aLoop, sizeof(WhereLoop*)*iLoop);
3619 pTo->aLoop[iLoop] = pWLoop;
3620 if( nTo>=mxChoice ){
drhfde1e6b2013-09-06 17:45:42 +00003621 mxI = 0;
drha18f3d22013-05-08 03:05:41 +00003622 mxCost = aTo[0].rCost;
dan50ae31e2014-08-08 16:52:28 +00003623 mxUnsorted = aTo[0].nRow;
drha18f3d22013-05-08 03:05:41 +00003624 for(jj=1, pTo=&aTo[1]; jj<mxChoice; jj++, pTo++){
dan50ae31e2014-08-08 16:52:28 +00003625 if( pTo->rCost>mxCost
3626 || (pTo->rCost==mxCost && pTo->rUnsorted>mxUnsorted)
3627 ){
drhfde1e6b2013-09-06 17:45:42 +00003628 mxCost = pTo->rCost;
dan50ae31e2014-08-08 16:52:28 +00003629 mxUnsorted = pTo->rUnsorted;
drhfde1e6b2013-09-06 17:45:42 +00003630 mxI = jj;
3631 }
drha18f3d22013-05-08 03:05:41 +00003632 }
3633 }
3634 }
3635 }
3636
drh989578e2013-10-28 14:34:35 +00003637#ifdef WHERETRACE_ENABLED /* >=2 */
drh1b131b72014-10-21 16:01:40 +00003638 if( sqlite3WhereTrace & 0x02 ){
drha50ef112013-05-22 02:06:59 +00003639 sqlite3DebugPrintf("---- after round %d ----\n", iLoop);
drhd15cb172013-05-21 19:23:10 +00003640 for(ii=0, pTo=aTo; ii<nTo; ii++, pTo++){
drhb8a8e8a2013-06-10 19:12:39 +00003641 sqlite3DebugPrintf(" %s cost=%-3d nrow=%-3d order=%c",
drha50ef112013-05-22 02:06:59 +00003642 wherePathName(pTo, iLoop+1, 0), pTo->rCost, pTo->nRow,
drh0401ace2014-03-18 15:30:27 +00003643 pTo->isOrdered>=0 ? (pTo->isOrdered+'0') : '?');
3644 if( pTo->isOrdered>0 ){
drh88da6442013-05-27 17:59:37 +00003645 sqlite3DebugPrintf(" rev=0x%llx\n", pTo->revLoop);
3646 }else{
3647 sqlite3DebugPrintf("\n");
3648 }
drhf204dac2013-05-08 03:22:07 +00003649 }
3650 }
3651#endif
3652
drh6b7157b2013-05-10 02:00:35 +00003653 /* Swap the roles of aFrom and aTo for the next generation */
drha18f3d22013-05-08 03:05:41 +00003654 pFrom = aTo;
3655 aTo = aFrom;
3656 aFrom = pFrom;
3657 nFrom = nTo;
3658 }
3659
drh75b93402013-05-31 20:43:57 +00003660 if( nFrom==0 ){
drhe1e2e9a2013-06-13 15:16:53 +00003661 sqlite3ErrorMsg(pParse, "no query solution");
drh75b93402013-05-31 20:43:57 +00003662 sqlite3DbFree(db, pSpace);
3663 return SQLITE_ERROR;
3664 }
drha18f3d22013-05-08 03:05:41 +00003665
drh6b7157b2013-05-10 02:00:35 +00003666 /* Find the lowest cost path. pFrom will be left pointing to that path */
drha18f3d22013-05-08 03:05:41 +00003667 pFrom = aFrom;
3668 for(ii=1; ii<nFrom; ii++){
3669 if( pFrom->rCost>aFrom[ii].rCost ) pFrom = &aFrom[ii];
3670 }
3671 assert( pWInfo->nLevel==nLoop );
drh6b7157b2013-05-10 02:00:35 +00003672 /* Load the lowest cost path into pWInfo */
drha18f3d22013-05-08 03:05:41 +00003673 for(iLoop=0; iLoop<nLoop; iLoop++){
drh7ba39a92013-05-30 17:43:19 +00003674 WhereLevel *pLevel = pWInfo->a + iLoop;
3675 pLevel->pWLoop = pWLoop = pFrom->aLoop[iLoop];
drhe217efc2013-06-12 03:48:41 +00003676 pLevel->iFrom = pWLoop->iTab;
drh7ba39a92013-05-30 17:43:19 +00003677 pLevel->iTabCur = pWInfo->pTabList->a[pLevel->iFrom].iCursor;
drha18f3d22013-05-08 03:05:41 +00003678 }
drhfd636c72013-06-21 02:05:06 +00003679 if( (pWInfo->wctrlFlags & WHERE_WANT_DISTINCT)!=0
3680 && (pWInfo->wctrlFlags & WHERE_DISTINCTBY)==0
3681 && pWInfo->eDistinct==WHERE_DISTINCT_NOOP
drh4f402f22013-06-11 18:59:38 +00003682 && nRowEst
3683 ){
3684 Bitmask notUsed;
drh6457a352013-06-21 00:35:37 +00003685 int rc = wherePathSatisfiesOrderBy(pWInfo, pWInfo->pResultSet, pFrom,
drh93ec45d2013-06-17 18:20:48 +00003686 WHERE_DISTINCTBY, nLoop-1, pFrom->aLoop[nLoop-1], &notUsed);
drh0401ace2014-03-18 15:30:27 +00003687 if( rc==pWInfo->pResultSet->nExpr ){
3688 pWInfo->eDistinct = WHERE_DISTINCT_ORDERED;
3689 }
drh4f402f22013-06-11 18:59:38 +00003690 }
drh079a3072014-03-19 14:10:55 +00003691 if( pWInfo->pOrderBy ){
drh4f402f22013-06-11 18:59:38 +00003692 if( pWInfo->wctrlFlags & WHERE_DISTINCTBY ){
drh079a3072014-03-19 14:10:55 +00003693 if( pFrom->isOrdered==pWInfo->pOrderBy->nExpr ){
3694 pWInfo->eDistinct = WHERE_DISTINCT_ORDERED;
3695 }
drh4f402f22013-06-11 18:59:38 +00003696 }else{
drhddba0c22014-03-18 20:33:42 +00003697 pWInfo->nOBSat = pFrom->isOrdered;
drhea6c36e2014-03-19 14:30:55 +00003698 if( pWInfo->nOBSat<0 ) pWInfo->nOBSat = 0;
drh4f402f22013-06-11 18:59:38 +00003699 pWInfo->revMask = pFrom->revLoop;
3700 }
dan374cd782014-04-21 13:21:56 +00003701 if( (pWInfo->wctrlFlags & WHERE_SORTBYGROUP)
drh11b04812015-04-12 01:22:04 +00003702 && pWInfo->nOBSat==pWInfo->pOrderBy->nExpr && nLoop>0
dan374cd782014-04-21 13:21:56 +00003703 ){
danb6453202014-10-10 20:52:53 +00003704 Bitmask revMask = 0;
dan374cd782014-04-21 13:21:56 +00003705 int nOrder = wherePathSatisfiesOrderBy(pWInfo, pWInfo->pOrderBy,
danb6453202014-10-10 20:52:53 +00003706 pFrom, 0, nLoop-1, pFrom->aLoop[nLoop-1], &revMask
dan374cd782014-04-21 13:21:56 +00003707 );
3708 assert( pWInfo->sorted==0 );
danb6453202014-10-10 20:52:53 +00003709 if( nOrder==pWInfo->pOrderBy->nExpr ){
3710 pWInfo->sorted = 1;
3711 pWInfo->revMask = revMask;
3712 }
dan374cd782014-04-21 13:21:56 +00003713 }
drh6b7157b2013-05-10 02:00:35 +00003714 }
dan374cd782014-04-21 13:21:56 +00003715
3716
drha50ef112013-05-22 02:06:59 +00003717 pWInfo->nRowOut = pFrom->nRow;
drha18f3d22013-05-08 03:05:41 +00003718
3719 /* Free temporary memory and return success */
3720 sqlite3DbFree(db, pSpace);
3721 return SQLITE_OK;
3722}
drh94a11212004-09-25 13:12:14 +00003723
3724/*
drh60c96cd2013-06-09 17:21:25 +00003725** Most queries use only a single table (they are not joins) and have
3726** simple == constraints against indexed fields. This routine attempts
3727** to plan those simple cases using much less ceremony than the
3728** general-purpose query planner, and thereby yield faster sqlite3_prepare()
3729** times for the common case.
3730**
3731** Return non-zero on success, if this query can be handled by this
3732** no-frills query planner. Return zero if this query needs the
3733** general-purpose query planner.
3734*/
drhb8a8e8a2013-06-10 19:12:39 +00003735static int whereShortCut(WhereLoopBuilder *pBuilder){
drh60c96cd2013-06-09 17:21:25 +00003736 WhereInfo *pWInfo;
3737 struct SrcList_item *pItem;
3738 WhereClause *pWC;
3739 WhereTerm *pTerm;
3740 WhereLoop *pLoop;
3741 int iCur;
drh92a121f2013-06-10 12:15:47 +00003742 int j;
drh60c96cd2013-06-09 17:21:25 +00003743 Table *pTab;
3744 Index *pIdx;
3745
3746 pWInfo = pBuilder->pWInfo;
drh5822d6f2013-06-10 23:30:09 +00003747 if( pWInfo->wctrlFlags & WHERE_FORCE_TABLE ) return 0;
drh60c96cd2013-06-09 17:21:25 +00003748 assert( pWInfo->pTabList->nSrc>=1 );
3749 pItem = pWInfo->pTabList->a;
3750 pTab = pItem->pTab;
3751 if( IsVirtual(pTab) ) return 0;
drh8a48b9c2015-08-19 15:20:00 +00003752 if( pItem->fg.isIndexedBy ) return 0;
drh60c96cd2013-06-09 17:21:25 +00003753 iCur = pItem->iCursor;
3754 pWC = &pWInfo->sWC;
3755 pLoop = pBuilder->pNew;
drh60c96cd2013-06-09 17:21:25 +00003756 pLoop->wsFlags = 0;
drhc8bbce12014-10-21 01:05:09 +00003757 pLoop->nSkip = 0;
drh6f82e852015-06-06 20:12:09 +00003758 pTerm = sqlite3WhereFindTerm(pWC, iCur, -1, 0, WO_EQ|WO_IS, 0);
drh60c96cd2013-06-09 17:21:25 +00003759 if( pTerm ){
drhe8d0c612015-05-14 01:05:25 +00003760 testcase( pTerm->eOperator & WO_IS );
drh60c96cd2013-06-09 17:21:25 +00003761 pLoop->wsFlags = WHERE_COLUMN_EQ|WHERE_IPK|WHERE_ONEROW;
3762 pLoop->aLTerm[0] = pTerm;
3763 pLoop->nLTerm = 1;
3764 pLoop->u.btree.nEq = 1;
drhe1e2e9a2013-06-13 15:16:53 +00003765 /* TUNING: Cost of a rowid lookup is 10 */
drhbf539c42013-10-05 18:16:02 +00003766 pLoop->rRun = 33; /* 33==sqlite3LogEst(10) */
drh60c96cd2013-06-09 17:21:25 +00003767 }else{
3768 for(pIdx=pTab->pIndex; pIdx; pIdx=pIdx->pNext){
mistachkin4e5bef82015-05-15 20:14:00 +00003769 int opMask;
dancd40abb2013-08-29 10:46:05 +00003770 assert( pLoop->aLTermSpace==pLoop->aLTerm );
drh5f1d1d92014-07-31 22:59:04 +00003771 if( !IsUniqueIndex(pIdx)
dancd40abb2013-08-29 10:46:05 +00003772 || pIdx->pPartIdxWhere!=0
drhbbbdc832013-10-22 18:01:40 +00003773 || pIdx->nKeyCol>ArraySize(pLoop->aLTermSpace)
dancd40abb2013-08-29 10:46:05 +00003774 ) continue;
mistachkin4e5bef82015-05-15 20:14:00 +00003775 opMask = pIdx->uniqNotNull ? (WO_EQ|WO_IS) : WO_EQ;
drhbbbdc832013-10-22 18:01:40 +00003776 for(j=0; j<pIdx->nKeyCol; j++){
drh6f82e852015-06-06 20:12:09 +00003777 pTerm = sqlite3WhereFindTerm(pWC, iCur, pIdx->aiColumn[j], 0, opMask, pIdx);
drh60c96cd2013-06-09 17:21:25 +00003778 if( pTerm==0 ) break;
dan3072b532015-05-15 19:59:23 +00003779 testcase( pTerm->eOperator & WO_IS );
drh60c96cd2013-06-09 17:21:25 +00003780 pLoop->aLTerm[j] = pTerm;
3781 }
drhbbbdc832013-10-22 18:01:40 +00003782 if( j!=pIdx->nKeyCol ) continue;
drh92a121f2013-06-10 12:15:47 +00003783 pLoop->wsFlags = WHERE_COLUMN_EQ|WHERE_ONEROW|WHERE_INDEXED;
drhec95c442013-10-23 01:57:32 +00003784 if( pIdx->isCovering || (pItem->colUsed & ~columnsInIndex(pIdx))==0 ){
drh92a121f2013-06-10 12:15:47 +00003785 pLoop->wsFlags |= WHERE_IDX_ONLY;
3786 }
drh60c96cd2013-06-09 17:21:25 +00003787 pLoop->nLTerm = j;
3788 pLoop->u.btree.nEq = j;
3789 pLoop->u.btree.pIndex = pIdx;
drhe1e2e9a2013-06-13 15:16:53 +00003790 /* TUNING: Cost of a unique index lookup is 15 */
drhbf539c42013-10-05 18:16:02 +00003791 pLoop->rRun = 39; /* 39==sqlite3LogEst(15) */
drh60c96cd2013-06-09 17:21:25 +00003792 break;
3793 }
3794 }
drh3b75ffa2013-06-10 14:56:25 +00003795 if( pLoop->wsFlags ){
drhbf539c42013-10-05 18:16:02 +00003796 pLoop->nOut = (LogEst)1;
drh3b75ffa2013-06-10 14:56:25 +00003797 pWInfo->a[0].pWLoop = pLoop;
drh6f82e852015-06-06 20:12:09 +00003798 pLoop->maskSelf = sqlite3WhereGetMask(&pWInfo->sMaskSet, iCur);
drh3b75ffa2013-06-10 14:56:25 +00003799 pWInfo->a[0].iTabCur = iCur;
3800 pWInfo->nRowOut = 1;
drhddba0c22014-03-18 20:33:42 +00003801 if( pWInfo->pOrderBy ) pWInfo->nOBSat = pWInfo->pOrderBy->nExpr;
drh6457a352013-06-21 00:35:37 +00003802 if( pWInfo->wctrlFlags & WHERE_WANT_DISTINCT ){
3803 pWInfo->eDistinct = WHERE_DISTINCT_UNIQUE;
3804 }
drh3b75ffa2013-06-10 14:56:25 +00003805#ifdef SQLITE_DEBUG
3806 pLoop->cId = '0';
3807#endif
3808 return 1;
3809 }
3810 return 0;
drh60c96cd2013-06-09 17:21:25 +00003811}
3812
3813/*
drhe3184742002-06-19 14:27:05 +00003814** Generate the beginning of the loop used for WHERE clause processing.
drhacf3b982005-01-03 01:27:18 +00003815** The return value is a pointer to an opaque structure that contains
drh75897232000-05-29 14:26:00 +00003816** information needed to terminate the loop. Later, the calling routine
danielk19774adee202004-05-08 08:23:19 +00003817** should invoke sqlite3WhereEnd() with the return value of this function
drh75897232000-05-29 14:26:00 +00003818** in order to complete the WHERE clause processing.
3819**
3820** If an error occurs, this routine returns NULL.
drhc27a1ce2002-06-14 20:58:45 +00003821**
3822** The basic idea is to do a nested loop, one loop for each table in
3823** the FROM clause of a select. (INSERT and UPDATE statements are the
3824** same as a SELECT with only a single table in the FROM clause.) For
3825** example, if the SQL is this:
3826**
3827** SELECT * FROM t1, t2, t3 WHERE ...;
3828**
3829** Then the code generated is conceptually like the following:
3830**
3831** foreach row1 in t1 do \ Code generated
danielk19774adee202004-05-08 08:23:19 +00003832** foreach row2 in t2 do |-- by sqlite3WhereBegin()
drhc27a1ce2002-06-14 20:58:45 +00003833** foreach row3 in t3 do /
3834** ...
3835** end \ Code generated
danielk19774adee202004-05-08 08:23:19 +00003836** end |-- by sqlite3WhereEnd()
drhc27a1ce2002-06-14 20:58:45 +00003837** end /
3838**
drh29dda4a2005-07-21 18:23:20 +00003839** Note that the loops might not be nested in the order in which they
3840** appear in the FROM clause if a different order is better able to make
drh51147ba2005-07-23 22:59:55 +00003841** use of indices. Note also that when the IN operator appears in
3842** the WHERE clause, it might result in additional nested loops for
3843** scanning through all values on the right-hand side of the IN.
drh29dda4a2005-07-21 18:23:20 +00003844**
drhc27a1ce2002-06-14 20:58:45 +00003845** There are Btree cursors associated with each table. t1 uses cursor
drh6a3ea0e2003-05-02 14:32:12 +00003846** number pTabList->a[0].iCursor. t2 uses the cursor pTabList->a[1].iCursor.
3847** And so forth. This routine generates code to open those VDBE cursors
danielk19774adee202004-05-08 08:23:19 +00003848** and sqlite3WhereEnd() generates the code to close them.
drhc27a1ce2002-06-14 20:58:45 +00003849**
drhe6f85e72004-12-25 01:03:13 +00003850** The code that sqlite3WhereBegin() generates leaves the cursors named
3851** in pTabList pointing at their appropriate entries. The [...] code
drhf0863fe2005-06-12 21:35:51 +00003852** can use OP_Column and OP_Rowid opcodes on these cursors to extract
drhe6f85e72004-12-25 01:03:13 +00003853** data from the various tables of the loop.
3854**
drhc27a1ce2002-06-14 20:58:45 +00003855** If the WHERE clause is empty, the foreach loops must each scan their
3856** entire tables. Thus a three-way join is an O(N^3) operation. But if
3857** the tables have indices and there are terms in the WHERE clause that
3858** refer to those indices, a complete table scan can be avoided and the
3859** code will run much faster. Most of the work of this routine is checking
3860** to see if there are indices that can be used to speed up the loop.
3861**
3862** Terms of the WHERE clause are also used to limit which rows actually
3863** make it to the "..." in the middle of the loop. After each "foreach",
3864** terms of the WHERE clause that use only terms in that loop and outer
3865** loops are evaluated and if false a jump is made around all subsequent
3866** inner loops (or around the "..." if the test occurs within the inner-
3867** most loop)
3868**
3869** OUTER JOINS
3870**
3871** An outer join of tables t1 and t2 is conceptually coded as follows:
3872**
3873** foreach row1 in t1 do
3874** flag = 0
3875** foreach row2 in t2 do
3876** start:
3877** ...
3878** flag = 1
3879** end
drhe3184742002-06-19 14:27:05 +00003880** if flag==0 then
3881** move the row2 cursor to a null row
3882** goto start
3883** fi
drhc27a1ce2002-06-14 20:58:45 +00003884** end
3885**
drhe3184742002-06-19 14:27:05 +00003886** ORDER BY CLAUSE PROCESSING
3887**
drh94433422013-07-01 11:05:50 +00003888** pOrderBy is a pointer to the ORDER BY clause (or the GROUP BY clause
3889** if the WHERE_GROUPBY flag is set in wctrlFlags) of a SELECT statement
drhe3184742002-06-19 14:27:05 +00003890** if there is one. If there is no ORDER BY clause or if this routine
drh46ec5b62012-09-24 15:30:54 +00003891** is called from an UPDATE or DELETE statement, then pOrderBy is NULL.
drhfc8d4f92013-11-08 15:19:46 +00003892**
3893** The iIdxCur parameter is the cursor number of an index. If
3894** WHERE_ONETABLE_ONLY is set, iIdxCur is the cursor number of an index
3895** to use for OR clause processing. The WHERE clause should use this
3896** specific cursor. If WHERE_ONEPASS_DESIRED is set, then iIdxCur is
3897** the first cursor in an array of cursors for all indices. iIdxCur should
3898** be used to compute the appropriate cursor depending on which index is
3899** used.
drh75897232000-05-29 14:26:00 +00003900*/
danielk19774adee202004-05-08 08:23:19 +00003901WhereInfo *sqlite3WhereBegin(
danielk1977ed326d72004-11-16 15:50:19 +00003902 Parse *pParse, /* The parser context */
drh6457a352013-06-21 00:35:37 +00003903 SrcList *pTabList, /* FROM clause: A list of all tables to be scanned */
danielk1977ed326d72004-11-16 15:50:19 +00003904 Expr *pWhere, /* The WHERE clause */
drh0401ace2014-03-18 15:30:27 +00003905 ExprList *pOrderBy, /* An ORDER BY (or GROUP BY) clause, or NULL */
drh6457a352013-06-21 00:35:37 +00003906 ExprList *pResultSet, /* Result set of the query */
dan0efb72c2012-08-24 18:44:56 +00003907 u16 wctrlFlags, /* One of the WHERE_* flags defined in sqliteInt.h */
3908 int iIdxCur /* If WHERE_ONETABLE_ONLY is set, index cursor number */
drh75897232000-05-29 14:26:00 +00003909){
danielk1977be229652009-03-20 14:18:51 +00003910 int nByteWInfo; /* Num. bytes allocated for WhereInfo struct */
drhc01a3c12009-12-16 22:10:49 +00003911 int nTabList; /* Number of elements in pTabList */
drh75897232000-05-29 14:26:00 +00003912 WhereInfo *pWInfo; /* Will become the return value of this function */
3913 Vdbe *v = pParse->pVdbe; /* The virtual database engine */
drhfe05af82005-07-21 03:14:59 +00003914 Bitmask notReady; /* Cursors that are not yet positioned */
drh1c8148f2013-05-04 20:25:23 +00003915 WhereLoopBuilder sWLB; /* The WhereLoop builder */
drh111a6a72008-12-21 03:51:16 +00003916 WhereMaskSet *pMaskSet; /* The expression mask set */
drh56f1b992012-09-25 14:29:39 +00003917 WhereLevel *pLevel; /* A single level in pWInfo->a[] */
drhfd636c72013-06-21 02:05:06 +00003918 WhereLoop *pLoop; /* Pointer to a single WhereLoop object */
drh9cd1c992012-09-25 20:43:35 +00003919 int ii; /* Loop counter */
drh17435752007-08-16 04:30:38 +00003920 sqlite3 *db; /* Database connection */
drh5346e952013-05-08 14:14:26 +00003921 int rc; /* Return code */
drh75897232000-05-29 14:26:00 +00003922
drh56f1b992012-09-25 14:29:39 +00003923
3924 /* Variable initialization */
drhfd636c72013-06-21 02:05:06 +00003925 db = pParse->db;
drh1c8148f2013-05-04 20:25:23 +00003926 memset(&sWLB, 0, sizeof(sWLB));
drh0401ace2014-03-18 15:30:27 +00003927
3928 /* An ORDER/GROUP BY clause of more than 63 terms cannot be optimized */
3929 testcase( pOrderBy && pOrderBy->nExpr==BMS-1 );
3930 if( pOrderBy && pOrderBy->nExpr>=BMS ) pOrderBy = 0;
drh1c8148f2013-05-04 20:25:23 +00003931 sWLB.pOrderBy = pOrderBy;
drh56f1b992012-09-25 14:29:39 +00003932
drhfd636c72013-06-21 02:05:06 +00003933 /* Disable the DISTINCT optimization if SQLITE_DistinctOpt is set via
3934 ** sqlite3_test_ctrl(SQLITE_TESTCTRL_OPTIMIZATIONS,...) */
3935 if( OptimizationDisabled(db, SQLITE_DistinctOpt) ){
3936 wctrlFlags &= ~WHERE_WANT_DISTINCT;
3937 }
3938
drh29dda4a2005-07-21 18:23:20 +00003939 /* The number of tables in the FROM clause is limited by the number of
drh1398ad32005-01-19 23:24:50 +00003940 ** bits in a Bitmask
3941 */
drh67ae0cb2010-04-08 14:38:51 +00003942 testcase( pTabList->nSrc==BMS );
drh29dda4a2005-07-21 18:23:20 +00003943 if( pTabList->nSrc>BMS ){
3944 sqlite3ErrorMsg(pParse, "at most %d tables in a join", BMS);
drh1398ad32005-01-19 23:24:50 +00003945 return 0;
3946 }
3947
drhc01a3c12009-12-16 22:10:49 +00003948 /* This function normally generates a nested loop for all tables in
3949 ** pTabList. But if the WHERE_ONETABLE_ONLY flag is set, then we should
3950 ** only generate code for the first table in pTabList and assume that
3951 ** any cursors associated with subsequent tables are uninitialized.
3952 */
3953 nTabList = (wctrlFlags & WHERE_ONETABLE_ONLY) ? 1 : pTabList->nSrc;
3954
drh75897232000-05-29 14:26:00 +00003955 /* Allocate and initialize the WhereInfo structure that will become the
danielk1977be229652009-03-20 14:18:51 +00003956 ** return value. A single allocation is used to store the WhereInfo
3957 ** struct, the contents of WhereInfo.a[], the WhereClause structure
3958 ** and the WhereMaskSet structure. Since WhereClause contains an 8-byte
3959 ** field (type Bitmask) it must be aligned on an 8-byte boundary on
3960 ** some architectures. Hence the ROUND8() below.
drh75897232000-05-29 14:26:00 +00003961 */
drhc01a3c12009-12-16 22:10:49 +00003962 nByteWInfo = ROUND8(sizeof(WhereInfo)+(nTabList-1)*sizeof(WhereLevel));
drh60c96cd2013-06-09 17:21:25 +00003963 pWInfo = sqlite3DbMallocZero(db, nByteWInfo + sizeof(WhereLoop));
drh17435752007-08-16 04:30:38 +00003964 if( db->mallocFailed ){
drh8b307fb2010-04-06 15:57:05 +00003965 sqlite3DbFree(db, pWInfo);
3966 pWInfo = 0;
danielk197785574e32008-10-06 05:32:18 +00003967 goto whereBeginError;
drh75897232000-05-29 14:26:00 +00003968 }
drhfc8d4f92013-11-08 15:19:46 +00003969 pWInfo->aiCurOnePass[0] = pWInfo->aiCurOnePass[1] = -1;
drhc01a3c12009-12-16 22:10:49 +00003970 pWInfo->nLevel = nTabList;
drh75897232000-05-29 14:26:00 +00003971 pWInfo->pParse = pParse;
3972 pWInfo->pTabList = pTabList;
drh6b7157b2013-05-10 02:00:35 +00003973 pWInfo->pOrderBy = pOrderBy;
drh6457a352013-06-21 00:35:37 +00003974 pWInfo->pResultSet = pResultSet;
drha22a75e2014-03-21 18:16:23 +00003975 pWInfo->iBreak = pWInfo->iContinue = sqlite3VdbeMakeLabel(v);
drh6df2acd2008-12-28 16:55:25 +00003976 pWInfo->wctrlFlags = wctrlFlags;
drh8b307fb2010-04-06 15:57:05 +00003977 pWInfo->savedNQueryLoop = pParse->nQueryLoop;
drh70d18342013-06-06 19:16:33 +00003978 pMaskSet = &pWInfo->sMaskSet;
drh1c8148f2013-05-04 20:25:23 +00003979 sWLB.pWInfo = pWInfo;
drh70d18342013-06-06 19:16:33 +00003980 sWLB.pWC = &pWInfo->sWC;
drh1ac87e12013-07-18 14:50:56 +00003981 sWLB.pNew = (WhereLoop*)(((char*)pWInfo)+nByteWInfo);
3982 assert( EIGHT_BYTE_ALIGNMENT(sWLB.pNew) );
drh60c96cd2013-06-09 17:21:25 +00003983 whereLoopInit(sWLB.pNew);
drhb8a8e8a2013-06-10 19:12:39 +00003984#ifdef SQLITE_DEBUG
3985 sWLB.pNew->cId = '*';
3986#endif
drh08192d52002-04-30 19:20:28 +00003987
drh111a6a72008-12-21 03:51:16 +00003988 /* Split the WHERE clause into separate subexpressions where each
3989 ** subexpression is separated by an AND operator.
3990 */
3991 initMaskSet(pMaskSet);
drh6c1f4ef2015-06-08 14:23:15 +00003992 sqlite3WhereClauseInit(&pWInfo->sWC, pWInfo);
3993 sqlite3WhereSplit(&pWInfo->sWC, pWhere, TK_AND);
drh111a6a72008-12-21 03:51:16 +00003994
drh08192d52002-04-30 19:20:28 +00003995 /* Special case: a WHERE clause that is constant. Evaluate the
3996 ** expression and either jump over all of the code or fall thru.
3997 */
drh759e8582014-01-02 21:05:10 +00003998 for(ii=0; ii<sWLB.pWC->nTerm; ii++){
3999 if( nTabList==0 || sqlite3ExprIsConstantNotJoin(sWLB.pWC->a[ii].pExpr) ){
4000 sqlite3ExprIfFalse(pParse, sWLB.pWC->a[ii].pExpr, pWInfo->iBreak,
4001 SQLITE_JUMPIFNULL);
4002 sWLB.pWC->a[ii].wtFlags |= TERM_CODED;
4003 }
drh08192d52002-04-30 19:20:28 +00004004 }
drh75897232000-05-29 14:26:00 +00004005
drh4fe425a2013-06-12 17:08:06 +00004006 /* Special case: No FROM clause
4007 */
4008 if( nTabList==0 ){
drhddba0c22014-03-18 20:33:42 +00004009 if( pOrderBy ) pWInfo->nOBSat = pOrderBy->nExpr;
drh6457a352013-06-21 00:35:37 +00004010 if( wctrlFlags & WHERE_WANT_DISTINCT ){
4011 pWInfo->eDistinct = WHERE_DISTINCT_UNIQUE;
4012 }
drh4fe425a2013-06-12 17:08:06 +00004013 }
4014
drh42165be2008-03-26 14:56:34 +00004015 /* Assign a bit from the bitmask to every term in the FROM clause.
4016 **
4017 ** When assigning bitmask values to FROM clause cursors, it must be
4018 ** the case that if X is the bitmask for the N-th FROM clause term then
4019 ** the bitmask for all FROM clause terms to the left of the N-th term
4020 ** is (X-1). An expression from the ON clause of a LEFT JOIN can use
4021 ** its Expr.iRightJoinTable value to find the bitmask of the right table
4022 ** of the join. Subtracting one from the right table bitmask gives a
4023 ** bitmask for all tables to the left of the join. Knowing the bitmask
4024 ** for all tables to the left of a left join is important. Ticket #3015.
danielk1977e672c8e2009-05-22 15:43:26 +00004025 **
drhc01a3c12009-12-16 22:10:49 +00004026 ** Note that bitmasks are created for all pTabList->nSrc tables in
4027 ** pTabList, not just the first nTabList tables. nTabList is normally
4028 ** equal to pTabList->nSrc but might be shortened to 1 if the
4029 ** WHERE_ONETABLE_ONLY flag is set.
drh42165be2008-03-26 14:56:34 +00004030 */
drh9cd1c992012-09-25 20:43:35 +00004031 for(ii=0; ii<pTabList->nSrc; ii++){
4032 createMask(pMaskSet, pTabList->a[ii].iCursor);
drh42165be2008-03-26 14:56:34 +00004033 }
4034#ifndef NDEBUG
4035 {
4036 Bitmask toTheLeft = 0;
drh9cd1c992012-09-25 20:43:35 +00004037 for(ii=0; ii<pTabList->nSrc; ii++){
drh6f82e852015-06-06 20:12:09 +00004038 Bitmask m = sqlite3WhereGetMask(pMaskSet, pTabList->a[ii].iCursor);
drh42165be2008-03-26 14:56:34 +00004039 assert( (m-1)==toTheLeft );
4040 toTheLeft |= m;
4041 }
4042 }
4043#endif
4044
drhb121dd12015-06-06 18:30:17 +00004045 /* Analyze all of the subexpressions. */
drh6c1f4ef2015-06-08 14:23:15 +00004046 sqlite3WhereExprAnalyze(pTabList, &pWInfo->sWC);
drhb121dd12015-06-06 18:30:17 +00004047 if( db->mallocFailed ) goto whereBeginError;
drh75897232000-05-29 14:26:00 +00004048
drh6457a352013-06-21 00:35:37 +00004049 if( wctrlFlags & WHERE_WANT_DISTINCT ){
4050 if( isDistinctRedundant(pParse, pTabList, &pWInfo->sWC, pResultSet) ){
4051 /* The DISTINCT marking is pointless. Ignore it. */
drh4f402f22013-06-11 18:59:38 +00004052 pWInfo->eDistinct = WHERE_DISTINCT_UNIQUE;
4053 }else if( pOrderBy==0 ){
drh6457a352013-06-21 00:35:37 +00004054 /* Try to ORDER BY the result set to make distinct processing easier */
drh4f402f22013-06-11 18:59:38 +00004055 pWInfo->wctrlFlags |= WHERE_DISTINCTBY;
drh6457a352013-06-21 00:35:37 +00004056 pWInfo->pOrderBy = pResultSet;
drh4f402f22013-06-11 18:59:38 +00004057 }
dan38cc40c2011-06-30 20:17:15 +00004058 }
4059
drhf1b5f5b2013-05-02 00:15:01 +00004060 /* Construct the WhereLoop objects */
drh3b48e8c2013-06-12 20:18:16 +00004061 WHERETRACE(0xffff,("*** Optimizer Start ***\n"));
drhc90713d2014-09-30 13:46:49 +00004062#if defined(WHERETRACE_ENABLED)
drhb121dd12015-06-06 18:30:17 +00004063 if( sqlite3WhereTrace & 0x100 ){ /* Display all terms of the WHERE clause */
drhc90713d2014-09-30 13:46:49 +00004064 int i;
4065 for(i=0; i<sWLB.pWC->nTerm; i++){
4066 whereTermPrint(&sWLB.pWC->a[i], i);
4067 }
4068 }
4069#endif
4070
drhb8a8e8a2013-06-10 19:12:39 +00004071 if( nTabList!=1 || whereShortCut(&sWLB)==0 ){
drh60c96cd2013-06-09 17:21:25 +00004072 rc = whereLoopAddAll(&sWLB);
4073 if( rc ) goto whereBeginError;
4074
drhb121dd12015-06-06 18:30:17 +00004075#ifdef WHERETRACE_ENABLED
4076 if( sqlite3WhereTrace ){ /* Display all of the WhereLoop objects */
drh60c96cd2013-06-09 17:21:25 +00004077 WhereLoop *p;
drhfd636c72013-06-21 02:05:06 +00004078 int i;
drhb121dd12015-06-06 18:30:17 +00004079 static const char zLabel[] = "0123456789abcdefghijklmnopqrstuvwyxz"
4080 "ABCDEFGHIJKLMNOPQRSTUVWYXZ";
drhfd636c72013-06-21 02:05:06 +00004081 for(p=pWInfo->pLoops, i=0; p; p=p->pNextLoop, i++){
4082 p->cId = zLabel[i%sizeof(zLabel)];
drhc1ba2e72013-10-28 19:03:21 +00004083 whereLoopPrint(p, sWLB.pWC);
drh60c96cd2013-06-09 17:21:25 +00004084 }
4085 }
4086#endif
4087
drh4f402f22013-06-11 18:59:38 +00004088 wherePathSolver(pWInfo, 0);
drh60c96cd2013-06-09 17:21:25 +00004089 if( db->mallocFailed ) goto whereBeginError;
4090 if( pWInfo->pOrderBy ){
drhc7f0d222013-06-19 03:27:12 +00004091 wherePathSolver(pWInfo, pWInfo->nRowOut+1);
drh60c96cd2013-06-09 17:21:25 +00004092 if( db->mallocFailed ) goto whereBeginError;
drha18f3d22013-05-08 03:05:41 +00004093 }
4094 }
drh60c96cd2013-06-09 17:21:25 +00004095 if( pWInfo->pOrderBy==0 && (db->flags & SQLITE_ReverseOrder)!=0 ){
drhd84ce352013-06-04 18:27:41 +00004096 pWInfo->revMask = (Bitmask)(-1);
drha50ef112013-05-22 02:06:59 +00004097 }
drh81186b42013-06-18 01:52:41 +00004098 if( pParse->nErr || NEVER(db->mallocFailed) ){
drh75b93402013-05-31 20:43:57 +00004099 goto whereBeginError;
4100 }
drhb121dd12015-06-06 18:30:17 +00004101#ifdef WHERETRACE_ENABLED
drha18f3d22013-05-08 03:05:41 +00004102 if( sqlite3WhereTrace ){
drh4f402f22013-06-11 18:59:38 +00004103 sqlite3DebugPrintf("---- Solution nRow=%d", pWInfo->nRowOut);
drhddba0c22014-03-18 20:33:42 +00004104 if( pWInfo->nOBSat>0 ){
4105 sqlite3DebugPrintf(" ORDERBY=%d,0x%llx", pWInfo->nOBSat, pWInfo->revMask);
drh319f6772013-05-14 15:31:07 +00004106 }
drh4f402f22013-06-11 18:59:38 +00004107 switch( pWInfo->eDistinct ){
4108 case WHERE_DISTINCT_UNIQUE: {
4109 sqlite3DebugPrintf(" DISTINCT=unique");
4110 break;
4111 }
4112 case WHERE_DISTINCT_ORDERED: {
4113 sqlite3DebugPrintf(" DISTINCT=ordered");
4114 break;
4115 }
4116 case WHERE_DISTINCT_UNORDERED: {
4117 sqlite3DebugPrintf(" DISTINCT=unordered");
4118 break;
4119 }
4120 }
4121 sqlite3DebugPrintf("\n");
drhfd636c72013-06-21 02:05:06 +00004122 for(ii=0; ii<pWInfo->nLevel; ii++){
drhc1ba2e72013-10-28 19:03:21 +00004123 whereLoopPrint(pWInfo->a[ii].pWLoop, sWLB.pWC);
drhf1b5f5b2013-05-02 00:15:01 +00004124 }
4125 }
4126#endif
drhfd636c72013-06-21 02:05:06 +00004127 /* Attempt to omit tables from the join that do not affect the result */
drh1031bd92013-06-22 15:44:26 +00004128 if( pWInfo->nLevel>=2
4129 && pResultSet!=0
4130 && OptimizationEnabled(db, SQLITE_OmitNoopJoin)
4131 ){
drh6c1f4ef2015-06-08 14:23:15 +00004132 Bitmask tabUsed = sqlite3WhereExprListUsage(pMaskSet, pResultSet);
4133 if( sWLB.pOrderBy ){
4134 tabUsed |= sqlite3WhereExprListUsage(pMaskSet, sWLB.pOrderBy);
4135 }
drhfd636c72013-06-21 02:05:06 +00004136 while( pWInfo->nLevel>=2 ){
drh9d5a5792013-06-28 13:43:33 +00004137 WhereTerm *pTerm, *pEnd;
drhfd636c72013-06-21 02:05:06 +00004138 pLoop = pWInfo->a[pWInfo->nLevel-1].pWLoop;
drh8a48b9c2015-08-19 15:20:00 +00004139 if( (pWInfo->pTabList->a[pLoop->iTab].fg.jointype & JT_LEFT)==0 ) break;
drhbc71b1d2013-06-21 02:15:48 +00004140 if( (wctrlFlags & WHERE_WANT_DISTINCT)==0
4141 && (pLoop->wsFlags & WHERE_ONEROW)==0
drhfd636c72013-06-21 02:05:06 +00004142 ){
drhfd636c72013-06-21 02:05:06 +00004143 break;
4144 }
drhbc71b1d2013-06-21 02:15:48 +00004145 if( (tabUsed & pLoop->maskSelf)!=0 ) break;
drh9d5a5792013-06-28 13:43:33 +00004146 pEnd = sWLB.pWC->a + sWLB.pWC->nTerm;
4147 for(pTerm=sWLB.pWC->a; pTerm<pEnd; pTerm++){
4148 if( (pTerm->prereqAll & pLoop->maskSelf)!=0
4149 && !ExprHasProperty(pTerm->pExpr, EP_FromJoin)
4150 ){
4151 break;
4152 }
4153 }
4154 if( pTerm<pEnd ) break;
drhbc71b1d2013-06-21 02:15:48 +00004155 WHERETRACE(0xffff, ("-> drop loop %c not used\n", pLoop->cId));
4156 pWInfo->nLevel--;
4157 nTabList--;
drhfd636c72013-06-21 02:05:06 +00004158 }
4159 }
drh3b48e8c2013-06-12 20:18:16 +00004160 WHERETRACE(0xffff,("*** Optimizer Finished ***\n"));
drh8e23daf2013-06-11 13:30:04 +00004161 pWInfo->pParse->nQueryLoop += pWInfo->nRowOut;
drhf1b5f5b2013-05-02 00:15:01 +00004162
drh08c88eb2008-04-10 13:33:18 +00004163 /* If the caller is an UPDATE or DELETE statement that is requesting
4164 ** to use a one-pass algorithm, determine if this is appropriate.
drh24b7fe92013-09-30 19:33:06 +00004165 ** The one-pass algorithm only works if the WHERE clause constrains
drhb121dd12015-06-06 18:30:17 +00004166 ** the statement to update or delete a single row.
drh08c88eb2008-04-10 13:33:18 +00004167 */
drh165be382008-12-05 02:36:33 +00004168 assert( (wctrlFlags & WHERE_ONEPASS_DESIRED)==0 || pWInfo->nLevel==1 );
drh3b48e8c2013-06-12 20:18:16 +00004169 if( (wctrlFlags & WHERE_ONEPASS_DESIRED)!=0
4170 && (pWInfo->a[0].pWLoop->wsFlags & WHERE_ONEROW)!=0 ){
drh08c88eb2008-04-10 13:33:18 +00004171 pWInfo->okOnePass = 1;
drh702ba9f2013-11-07 21:25:13 +00004172 if( HasRowid(pTabList->a[0].pTab) ){
4173 pWInfo->a[0].pWLoop->wsFlags &= ~WHERE_IDX_ONLY;
4174 }
drh08c88eb2008-04-10 13:33:18 +00004175 }
drheb04de32013-05-10 15:16:30 +00004176
drh9012bcb2004-12-19 00:11:35 +00004177 /* Open all tables in the pTabList and any indices selected for
4178 ** searching those tables.
4179 */
drh9cd1c992012-09-25 20:43:35 +00004180 for(ii=0, pLevel=pWInfo->a; ii<nTabList; ii++, pLevel++){
danielk1977da184232006-01-05 11:34:32 +00004181 Table *pTab; /* Table to open */
danielk1977da184232006-01-05 11:34:32 +00004182 int iDb; /* Index of database containing table/index */
drh56f1b992012-09-25 14:29:39 +00004183 struct SrcList_item *pTabItem;
drh9012bcb2004-12-19 00:11:35 +00004184
drh29dda4a2005-07-21 18:23:20 +00004185 pTabItem = &pTabList->a[pLevel->iFrom];
drh9012bcb2004-12-19 00:11:35 +00004186 pTab = pTabItem->pTab;
danielk1977595a5232009-07-24 17:58:53 +00004187 iDb = sqlite3SchemaToIndex(db, pTab->pSchema);
drh7ba39a92013-05-30 17:43:19 +00004188 pLoop = pLevel->pWLoop;
drh424aab82010-04-06 18:28:20 +00004189 if( (pTab->tabFlags & TF_Ephemeral)!=0 || pTab->pSelect ){
drh75bb9f52010-04-06 18:51:42 +00004190 /* Do nothing */
4191 }else
drh9eff6162006-06-12 21:59:13 +00004192#ifndef SQLITE_OMIT_VIRTUALTABLE
drh7ba39a92013-05-30 17:43:19 +00004193 if( (pLoop->wsFlags & WHERE_VIRTUALTABLE)!=0 ){
danielk1977595a5232009-07-24 17:58:53 +00004194 const char *pVTab = (const char *)sqlite3GetVTable(db, pTab);
danielk197793626f42006-06-20 13:07:27 +00004195 int iCur = pTabItem->iCursor;
danielk1977595a5232009-07-24 17:58:53 +00004196 sqlite3VdbeAddOp4(v, OP_VOpen, iCur, 0, 0, pVTab, P4_VTAB);
drhfc5e5462012-12-03 17:04:40 +00004197 }else if( IsVirtual(pTab) ){
4198 /* noop */
drh9eff6162006-06-12 21:59:13 +00004199 }else
4200#endif
drh7ba39a92013-05-30 17:43:19 +00004201 if( (pLoop->wsFlags & WHERE_IDX_ONLY)==0
drh9ef61f42011-10-07 14:40:59 +00004202 && (wctrlFlags & WHERE_OMIT_OPEN_CLOSE)==0 ){
drhfc8d4f92013-11-08 15:19:46 +00004203 int op = OP_OpenRead;
4204 if( pWInfo->okOnePass ){
4205 op = OP_OpenWrite;
4206 pWInfo->aiCurOnePass[0] = pTabItem->iCursor;
4207 };
drh08c88eb2008-04-10 13:33:18 +00004208 sqlite3OpenTable(pParse, pTabItem->iCursor, iDb, pTab, op);
drhfc8d4f92013-11-08 15:19:46 +00004209 assert( pTabItem->iCursor==pLevel->iTabCur );
drh7963b0e2013-06-17 21:37:40 +00004210 testcase( !pWInfo->okOnePass && pTab->nCol==BMS-1 );
4211 testcase( !pWInfo->okOnePass && pTab->nCol==BMS );
drhdd9930e2013-10-23 23:37:02 +00004212 if( !pWInfo->okOnePass && pTab->nCol<BMS && HasRowid(pTab) ){
danielk19779792eef2006-01-13 15:58:43 +00004213 Bitmask b = pTabItem->colUsed;
4214 int n = 0;
drh74161702006-02-24 02:53:49 +00004215 for(; b; b=b>>1, n++){}
drh8cff69d2009-11-12 19:59:44 +00004216 sqlite3VdbeChangeP4(v, sqlite3VdbeCurrentAddr(v)-1,
4217 SQLITE_INT_TO_PTR(n), P4_INT32);
danielk19779792eef2006-01-13 15:58:43 +00004218 assert( n<=pTab->nCol );
4219 }
drh97bae792015-06-05 15:59:57 +00004220#ifdef SQLITE_ENABLE_COLUMN_USED_MASK
4221 sqlite3VdbeAddOp4Dup8(v, OP_ColumnsUsed, pTabItem->iCursor, 0, 0,
4222 (const u8*)&pTabItem->colUsed, P4_INT64);
4223#endif
danielk1977c00da102006-01-07 13:21:04 +00004224 }else{
4225 sqlite3TableLock(pParse, iDb, pTab->tnum, 0, pTab->zName);
drh9012bcb2004-12-19 00:11:35 +00004226 }
drh7e47cb82013-05-31 17:55:27 +00004227 if( pLoop->wsFlags & WHERE_INDEXED ){
drh7ba39a92013-05-30 17:43:19 +00004228 Index *pIx = pLoop->u.btree.pIndex;
drhfc8d4f92013-11-08 15:19:46 +00004229 int iIndexCur;
4230 int op = OP_OpenRead;
drh4308e342013-11-11 16:55:52 +00004231 /* iIdxCur is always set to a positive value if ONEPASS is possible */
4232 assert( iIdxCur!=0 || (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 );
drh48dd1d82014-05-27 18:18:58 +00004233 if( !HasRowid(pTab) && IsPrimaryKeyIndex(pIx)
drha3bc66a2014-05-27 17:57:32 +00004234 && (wctrlFlags & WHERE_ONETABLE_ONLY)!=0
4235 ){
4236 /* This is one term of an OR-optimization using the PRIMARY KEY of a
4237 ** WITHOUT ROWID table. No need for a separate index */
4238 iIndexCur = pLevel->iTabCur;
4239 op = 0;
4240 }else if( pWInfo->okOnePass ){
drhfc8d4f92013-11-08 15:19:46 +00004241 Index *pJ = pTabItem->pTab->pIndex;
4242 iIndexCur = iIdxCur;
4243 assert( wctrlFlags & WHERE_ONEPASS_DESIRED );
4244 while( ALWAYS(pJ) && pJ!=pIx ){
4245 iIndexCur++;
4246 pJ = pJ->pNext;
4247 }
4248 op = OP_OpenWrite;
4249 pWInfo->aiCurOnePass[1] = iIndexCur;
4250 }else if( iIdxCur && (wctrlFlags & WHERE_ONETABLE_ONLY)!=0 ){
4251 iIndexCur = iIdxCur;
drh35263192014-07-22 20:02:19 +00004252 if( wctrlFlags & WHERE_REOPEN_IDX ) op = OP_ReopenIdx;
drhfc8d4f92013-11-08 15:19:46 +00004253 }else{
4254 iIndexCur = pParse->nTab++;
4255 }
4256 pLevel->iIdxCur = iIndexCur;
danielk1977da184232006-01-05 11:34:32 +00004257 assert( pIx->pSchema==pTab->pSchema );
drhb0367fb2012-08-25 02:11:13 +00004258 assert( iIndexCur>=0 );
drha3bc66a2014-05-27 17:57:32 +00004259 if( op ){
4260 sqlite3VdbeAddOp3(v, op, iIndexCur, pIx->tnum, iDb);
4261 sqlite3VdbeSetP4KeyInfo(pParse, pIx);
drhe0997b32015-03-20 14:57:50 +00004262 if( (pLoop->wsFlags & WHERE_CONSTRAINT)!=0
4263 && (pLoop->wsFlags & (WHERE_COLUMN_RANGE|WHERE_SKIPSCAN))==0
4264 && (pWInfo->wctrlFlags&WHERE_ORDERBY_MIN)==0
4265 ){
4266 sqlite3VdbeChangeP5(v, OPFLAG_SEEKEQ); /* Hint to COMDB2 */
4267 }
drha3bc66a2014-05-27 17:57:32 +00004268 VdbeComment((v, "%s", pIx->zName));
drh97bae792015-06-05 15:59:57 +00004269#ifdef SQLITE_ENABLE_COLUMN_USED_MASK
4270 {
4271 u64 colUsed = 0;
4272 int ii, jj;
4273 for(ii=0; ii<pIx->nColumn; ii++){
4274 jj = pIx->aiColumn[ii];
4275 if( jj<0 ) continue;
4276 if( jj>63 ) jj = 63;
4277 if( (pTabItem->colUsed & MASKBIT(jj))==0 ) continue;
4278 colUsed |= ((u64)1)<<(ii<63 ? ii : 63);
4279 }
4280 sqlite3VdbeAddOp4Dup8(v, OP_ColumnsUsed, iIndexCur, 0, 0,
4281 (u8*)&colUsed, P4_INT64);
4282 }
4283#endif /* SQLITE_ENABLE_COLUMN_USED_MASK */
drha3bc66a2014-05-27 17:57:32 +00004284 }
drh9012bcb2004-12-19 00:11:35 +00004285 }
drhaceb31b2014-02-08 01:40:27 +00004286 if( iDb>=0 ) sqlite3CodeVerifySchema(pParse, iDb);
drh9012bcb2004-12-19 00:11:35 +00004287 }
4288 pWInfo->iTop = sqlite3VdbeCurrentAddr(v);
drha21a64d2010-04-06 22:33:55 +00004289 if( db->mallocFailed ) goto whereBeginError;
drh9012bcb2004-12-19 00:11:35 +00004290
drh29dda4a2005-07-21 18:23:20 +00004291 /* Generate the code to do the search. Each iteration of the for
4292 ** loop below generates code for a single nested loop of the VM
4293 ** program.
drh75897232000-05-29 14:26:00 +00004294 */
drhfe05af82005-07-21 03:14:59 +00004295 notReady = ~(Bitmask)0;
drh9cd1c992012-09-25 20:43:35 +00004296 for(ii=0; ii<nTabList; ii++){
dan6f9702e2014-11-01 20:38:06 +00004297 int addrExplain;
4298 int wsFlags;
drh9cd1c992012-09-25 20:43:35 +00004299 pLevel = &pWInfo->a[ii];
dan6f9702e2014-11-01 20:38:06 +00004300 wsFlags = pLevel->pWLoop->wsFlags;
drhcc04afd2013-08-22 02:56:28 +00004301#ifndef SQLITE_OMIT_AUTOMATIC_INDEX
4302 if( (pLevel->pWLoop->wsFlags & WHERE_AUTO_INDEX)!=0 ){
4303 constructAutomaticIndex(pParse, &pWInfo->sWC,
4304 &pTabList->a[pLevel->iFrom], notReady, pLevel);
4305 if( db->mallocFailed ) goto whereBeginError;
4306 }
4307#endif
drh6f82e852015-06-06 20:12:09 +00004308 addrExplain = sqlite3WhereExplainOneScan(
dan6f9702e2014-11-01 20:38:06 +00004309 pParse, pTabList, pLevel, ii, pLevel->iFrom, wctrlFlags
4310 );
drhcc04afd2013-08-22 02:56:28 +00004311 pLevel->addrBody = sqlite3VdbeCurrentAddr(v);
drh6f82e852015-06-06 20:12:09 +00004312 notReady = sqlite3WhereCodeOneLoopStart(pWInfo, ii, notReady);
dan4a07e3d2010-11-09 14:48:59 +00004313 pWInfo->iContinue = pLevel->addrCont;
dan6f9702e2014-11-01 20:38:06 +00004314 if( (wsFlags&WHERE_MULTI_OR)==0 && (wctrlFlags&WHERE_ONETABLE_ONLY)==0 ){
drh6f82e852015-06-06 20:12:09 +00004315 sqlite3WhereAddScanStatus(v, pTabList, pLevel, addrExplain);
dan6f9702e2014-11-01 20:38:06 +00004316 }
drh75897232000-05-29 14:26:00 +00004317 }
drh7ec764a2005-07-21 03:48:20 +00004318
drh6fa978d2013-05-30 19:29:19 +00004319 /* Done. */
drh6bc69a22013-11-19 12:33:23 +00004320 VdbeModuleComment((v, "Begin WHERE-core"));
drh75897232000-05-29 14:26:00 +00004321 return pWInfo;
drhe23399f2005-07-22 00:31:39 +00004322
4323 /* Jump here if malloc fails */
danielk197785574e32008-10-06 05:32:18 +00004324whereBeginError:
drh8b307fb2010-04-06 15:57:05 +00004325 if( pWInfo ){
4326 pParse->nQueryLoop = pWInfo->savedNQueryLoop;
4327 whereInfoFree(db, pWInfo);
4328 }
drhe23399f2005-07-22 00:31:39 +00004329 return 0;
drh75897232000-05-29 14:26:00 +00004330}
4331
4332/*
drhc27a1ce2002-06-14 20:58:45 +00004333** Generate the end of the WHERE loop. See comments on
danielk19774adee202004-05-08 08:23:19 +00004334** sqlite3WhereBegin() for additional information.
drh75897232000-05-29 14:26:00 +00004335*/
danielk19774adee202004-05-08 08:23:19 +00004336void sqlite3WhereEnd(WhereInfo *pWInfo){
drh633e6d52008-07-28 19:34:53 +00004337 Parse *pParse = pWInfo->pParse;
4338 Vdbe *v = pParse->pVdbe;
drh19a775c2000-06-05 18:54:46 +00004339 int i;
drh6b563442001-11-07 16:48:26 +00004340 WhereLevel *pLevel;
drh7ba39a92013-05-30 17:43:19 +00004341 WhereLoop *pLoop;
drhad3cab52002-05-24 02:04:32 +00004342 SrcList *pTabList = pWInfo->pTabList;
drh633e6d52008-07-28 19:34:53 +00004343 sqlite3 *db = pParse->db;
drh19a775c2000-06-05 18:54:46 +00004344
drh9012bcb2004-12-19 00:11:35 +00004345 /* Generate loop termination code.
4346 */
drh6bc69a22013-11-19 12:33:23 +00004347 VdbeModuleComment((v, "End WHERE-core"));
drhceea3322009-04-23 13:22:42 +00004348 sqlite3ExprCacheClear(pParse);
drhc01a3c12009-12-16 22:10:49 +00004349 for(i=pWInfo->nLevel-1; i>=0; i--){
drhcd8629e2013-11-13 12:27:25 +00004350 int addr;
drh6b563442001-11-07 16:48:26 +00004351 pLevel = &pWInfo->a[i];
drh7ba39a92013-05-30 17:43:19 +00004352 pLoop = pLevel->pWLoop;
drhb3190c12008-12-08 21:37:14 +00004353 sqlite3VdbeResolveLabel(v, pLevel->addrCont);
drh6b563442001-11-07 16:48:26 +00004354 if( pLevel->op!=OP_Noop ){
drhe39a7322014-02-03 14:04:11 +00004355 sqlite3VdbeAddOp3(v, pLevel->op, pLevel->p1, pLevel->p2, pLevel->p3);
drhd1d38482008-10-07 23:46:38 +00004356 sqlite3VdbeChangeP5(v, pLevel->p5);
drh688852a2014-02-17 22:40:43 +00004357 VdbeCoverage(v);
drh7d176102014-02-18 03:07:12 +00004358 VdbeCoverageIf(v, pLevel->op==OP_Next);
4359 VdbeCoverageIf(v, pLevel->op==OP_Prev);
4360 VdbeCoverageIf(v, pLevel->op==OP_VNext);
drh19a775c2000-06-05 18:54:46 +00004361 }
drh7ba39a92013-05-30 17:43:19 +00004362 if( pLoop->wsFlags & WHERE_IN_ABLE && pLevel->u.in.nIn>0 ){
drh72e8fa42007-03-28 14:30:06 +00004363 struct InLoop *pIn;
drhe23399f2005-07-22 00:31:39 +00004364 int j;
drhb3190c12008-12-08 21:37:14 +00004365 sqlite3VdbeResolveLabel(v, pLevel->addrNxt);
drh111a6a72008-12-21 03:51:16 +00004366 for(j=pLevel->u.in.nIn, pIn=&pLevel->u.in.aInLoop[j-1]; j>0; j--, pIn--){
drhb3190c12008-12-08 21:37:14 +00004367 sqlite3VdbeJumpHere(v, pIn->addrInTop+1);
drh2d96b932013-02-08 18:48:23 +00004368 sqlite3VdbeAddOp2(v, pIn->eEndLoopOp, pIn->iCur, pIn->addrInTop);
drh688852a2014-02-17 22:40:43 +00004369 VdbeCoverage(v);
drh7d176102014-02-18 03:07:12 +00004370 VdbeCoverageIf(v, pIn->eEndLoopOp==OP_PrevIfOpen);
4371 VdbeCoverageIf(v, pIn->eEndLoopOp==OP_NextIfOpen);
drhb3190c12008-12-08 21:37:14 +00004372 sqlite3VdbeJumpHere(v, pIn->addrInTop-1);
drhe23399f2005-07-22 00:31:39 +00004373 }
drhd99f7062002-06-08 23:25:08 +00004374 }
drhb3190c12008-12-08 21:37:14 +00004375 sqlite3VdbeResolveLabel(v, pLevel->addrBrk);
drhcd8629e2013-11-13 12:27:25 +00004376 if( pLevel->addrSkip ){
drhcd8629e2013-11-13 12:27:25 +00004377 sqlite3VdbeAddOp2(v, OP_Goto, 0, pLevel->addrSkip);
drhe084f402013-11-13 17:24:38 +00004378 VdbeComment((v, "next skip-scan on %s", pLoop->u.btree.pIndex->zName));
drh2e5ef4e2013-11-13 16:58:54 +00004379 sqlite3VdbeJumpHere(v, pLevel->addrSkip);
4380 sqlite3VdbeJumpHere(v, pLevel->addrSkip-2);
drhcd8629e2013-11-13 12:27:25 +00004381 }
drhf07cf6e2015-03-06 16:45:16 +00004382 if( pLevel->addrLikeRep ){
drhb7c60ba2015-03-07 02:51:59 +00004383 int op;
4384 if( sqlite3VdbeGetOp(v, pLevel->addrLikeRep-1)->p1 ){
4385 op = OP_DecrJumpZero;
4386 }else{
4387 op = OP_JumpZeroIncr;
4388 }
4389 sqlite3VdbeAddOp2(v, op, pLevel->iLikeRepCntr, pLevel->addrLikeRep);
drhf07cf6e2015-03-06 16:45:16 +00004390 VdbeCoverage(v);
drhf07cf6e2015-03-06 16:45:16 +00004391 }
drhad2d8302002-05-24 20:31:36 +00004392 if( pLevel->iLeftJoin ){
drh688852a2014-02-17 22:40:43 +00004393 addr = sqlite3VdbeAddOp1(v, OP_IfPos, pLevel->iLeftJoin); VdbeCoverage(v);
drh7ba39a92013-05-30 17:43:19 +00004394 assert( (pLoop->wsFlags & WHERE_IDX_ONLY)==0
4395 || (pLoop->wsFlags & WHERE_INDEXED)!=0 );
4396 if( (pLoop->wsFlags & WHERE_IDX_ONLY)==0 ){
drh35451c62009-11-12 04:26:39 +00004397 sqlite3VdbeAddOp1(v, OP_NullRow, pTabList->a[i].iCursor);
4398 }
drh76f4cfb2013-05-31 18:20:52 +00004399 if( pLoop->wsFlags & WHERE_INDEXED ){
drh3c84ddf2008-01-09 02:15:38 +00004400 sqlite3VdbeAddOp1(v, OP_NullRow, pLevel->iIdxCur);
drh7f09b3e2002-08-13 13:15:49 +00004401 }
drh336a5302009-04-24 15:46:21 +00004402 if( pLevel->op==OP_Return ){
4403 sqlite3VdbeAddOp2(v, OP_Gosub, pLevel->p1, pLevel->addrFirst);
4404 }else{
4405 sqlite3VdbeAddOp2(v, OP_Goto, 0, pLevel->addrFirst);
4406 }
drhd654be82005-09-20 17:42:23 +00004407 sqlite3VdbeJumpHere(v, addr);
drhad2d8302002-05-24 20:31:36 +00004408 }
drh6bc69a22013-11-19 12:33:23 +00004409 VdbeModuleComment((v, "End WHERE-loop%d: %s", i,
drhfc8d4f92013-11-08 15:19:46 +00004410 pWInfo->pTabList->a[pLevel->iFrom].pTab->zName));
drh19a775c2000-06-05 18:54:46 +00004411 }
drh9012bcb2004-12-19 00:11:35 +00004412
4413 /* The "break" point is here, just past the end of the outer loop.
4414 ** Set it.
4415 */
danielk19774adee202004-05-08 08:23:19 +00004416 sqlite3VdbeResolveLabel(v, pWInfo->iBreak);
drh9012bcb2004-12-19 00:11:35 +00004417
drhfd636c72013-06-21 02:05:06 +00004418 assert( pWInfo->nLevel<=pTabList->nSrc );
drhc01a3c12009-12-16 22:10:49 +00004419 for(i=0, pLevel=pWInfo->a; i<pWInfo->nLevel; i++, pLevel++){
drh5f612292014-02-08 23:20:32 +00004420 int k, last;
4421 VdbeOp *pOp;
danbfca6a42012-08-24 10:52:35 +00004422 Index *pIdx = 0;
drh29dda4a2005-07-21 18:23:20 +00004423 struct SrcList_item *pTabItem = &pTabList->a[pLevel->iFrom];
drh9012bcb2004-12-19 00:11:35 +00004424 Table *pTab = pTabItem->pTab;
drh5cf590c2003-04-24 01:45:04 +00004425 assert( pTab!=0 );
drh7ba39a92013-05-30 17:43:19 +00004426 pLoop = pLevel->pWLoop;
drhfc8d4f92013-11-08 15:19:46 +00004427
drh5f612292014-02-08 23:20:32 +00004428 /* For a co-routine, change all OP_Column references to the table of
drh7b3aa082015-05-29 13:55:33 +00004429 ** the co-routine into OP_Copy of result contained in a register.
drh5f612292014-02-08 23:20:32 +00004430 ** OP_Rowid becomes OP_Null.
4431 */
drh8a48b9c2015-08-19 15:20:00 +00004432 if( pTabItem->fg.viaCoroutine && !db->mallocFailed ){
drh7b3aa082015-05-29 13:55:33 +00004433 translateColumnToCopy(v, pLevel->addrBody, pLevel->iTabCur,
4434 pTabItem->regResult);
drh5f612292014-02-08 23:20:32 +00004435 continue;
4436 }
4437
drhfc8d4f92013-11-08 15:19:46 +00004438 /* Close all of the cursors that were opened by sqlite3WhereBegin.
4439 ** Except, do not close cursors that will be reused by the OR optimization
4440 ** (WHERE_OMIT_OPEN_CLOSE). And do not close the OP_OpenWrite cursors
4441 ** created for the ONEPASS optimization.
4442 */
drh4139c992010-04-07 14:59:45 +00004443 if( (pTab->tabFlags & TF_Ephemeral)==0
4444 && pTab->pSelect==0
drh9ef61f42011-10-07 14:40:59 +00004445 && (pWInfo->wctrlFlags & WHERE_OMIT_OPEN_CLOSE)==0
drh4139c992010-04-07 14:59:45 +00004446 ){
drh7ba39a92013-05-30 17:43:19 +00004447 int ws = pLoop->wsFlags;
drh8b307fb2010-04-06 15:57:05 +00004448 if( !pWInfo->okOnePass && (ws & WHERE_IDX_ONLY)==0 ){
drh6df2acd2008-12-28 16:55:25 +00004449 sqlite3VdbeAddOp1(v, OP_Close, pTabItem->iCursor);
4450 }
drhfc8d4f92013-11-08 15:19:46 +00004451 if( (ws & WHERE_INDEXED)!=0
4452 && (ws & (WHERE_IPK|WHERE_AUTO_INDEX))==0
4453 && pLevel->iIdxCur!=pWInfo->aiCurOnePass[1]
4454 ){
drh6df2acd2008-12-28 16:55:25 +00004455 sqlite3VdbeAddOp1(v, OP_Close, pLevel->iIdxCur);
4456 }
drh9012bcb2004-12-19 00:11:35 +00004457 }
4458
drhf0030762013-06-14 13:27:01 +00004459 /* If this scan uses an index, make VDBE code substitutions to read data
4460 ** from the index instead of from the table where possible. In some cases
4461 ** this optimization prevents the table from ever being read, which can
4462 ** yield a significant performance boost.
drh9012bcb2004-12-19 00:11:35 +00004463 **
4464 ** Calls to the code generator in between sqlite3WhereBegin and
4465 ** sqlite3WhereEnd will have created code that references the table
4466 ** directly. This loop scans all that code looking for opcodes
4467 ** that reference the table and converts them into opcodes that
4468 ** reference the index.
4469 */
drh7ba39a92013-05-30 17:43:19 +00004470 if( pLoop->wsFlags & (WHERE_INDEXED|WHERE_IDX_ONLY) ){
4471 pIdx = pLoop->u.btree.pIndex;
4472 }else if( pLoop->wsFlags & WHERE_MULTI_OR ){
drhd40e2082012-08-24 23:24:15 +00004473 pIdx = pLevel->u.pCovidx;
danbfca6a42012-08-24 10:52:35 +00004474 }
drh7ba39a92013-05-30 17:43:19 +00004475 if( pIdx && !db->mallocFailed ){
drh9012bcb2004-12-19 00:11:35 +00004476 last = sqlite3VdbeCurrentAddr(v);
drhcc04afd2013-08-22 02:56:28 +00004477 k = pLevel->addrBody;
4478 pOp = sqlite3VdbeGetOp(v, k);
4479 for(; k<last; k++, pOp++){
drh9012bcb2004-12-19 00:11:35 +00004480 if( pOp->p1!=pLevel->iTabCur ) continue;
4481 if( pOp->opcode==OP_Column ){
drhee0ec8e2013-10-31 17:38:01 +00004482 int x = pOp->p2;
drh511717c2013-11-08 17:13:23 +00004483 assert( pIdx->pTable==pTab );
drhee0ec8e2013-10-31 17:38:01 +00004484 if( !HasRowid(pTab) ){
4485 Index *pPk = sqlite3PrimaryKeyIndex(pTab);
4486 x = pPk->aiColumn[x];
4487 }
4488 x = sqlite3ColumnOfIndex(pIdx, x);
drh44156282013-10-23 22:23:03 +00004489 if( x>=0 ){
4490 pOp->p2 = x;
4491 pOp->p1 = pLevel->iIdxCur;
drh9012bcb2004-12-19 00:11:35 +00004492 }
drh44156282013-10-23 22:23:03 +00004493 assert( (pLoop->wsFlags & WHERE_IDX_ONLY)==0 || x>=0 );
drhf0863fe2005-06-12 21:35:51 +00004494 }else if( pOp->opcode==OP_Rowid ){
drh9012bcb2004-12-19 00:11:35 +00004495 pOp->p1 = pLevel->iIdxCur;
drhf0863fe2005-06-12 21:35:51 +00004496 pOp->opcode = OP_IdxRowid;
drh9012bcb2004-12-19 00:11:35 +00004497 }
4498 }
drh6b563442001-11-07 16:48:26 +00004499 }
drh19a775c2000-06-05 18:54:46 +00004500 }
drh9012bcb2004-12-19 00:11:35 +00004501
4502 /* Final cleanup
4503 */
drhf12cde52010-04-08 17:28:00 +00004504 pParse->nQueryLoop = pWInfo->savedNQueryLoop;
4505 whereInfoFree(db, pWInfo);
drh75897232000-05-29 14:26:00 +00004506 return;
4507}