SQLite: Changes On Branch experimental-costs

Many hyperlinks are disabled.
Use anonymous login to enable hyperlinks.

Changes In Branch experimental-costs Excluding Merge-Ins

This is equivalent to a diff from af2cbe64ad to 05e6e16cb2

2014-04-30
15:22		Modify the way the costs of various query plans are estimated. If the user supplies a likelihood() value (or equivalent) on an indexed WHERE constraint, use it to estimate the number of index rows visited. (check-in: 90e3667647 user: dan tags: trunk)
15:00		Add text to the header comment of whereLoopAddBtree() describing how the costs of various b-tree loops are estimated. (Closed-Leaf check-in: 05e6e16cb2 user: dan tags: experimental-costs)
14:53		Update a couple of test cases to account for the fact that this branch prefers an index scan and partial sort over a full-table scan and full external sort. (check-in: 9b975bf33c user: dan tags: experimental-costs)
2014-04-29
16:46		Merge trunk changes into this branch. (check-in: d74299f037 user: dan tags: experimental-costs)
2014-04-28
18:02		Merge all recent trunk enhancements and fixes into the sessions branch. (check-in: e158812c34 user: drh tags: sessions)
17:56		Add the sqlite3_rtree_query_callback() API to the RTree virtual table. (Cherrypick from the sessions branch.) (check-in: af2cbe64ad user: drh tags: trunk)
17:51		Add the sqlite3_rtree_query_callback() API to the RTree virtual table. (check-in: 3dca280935 user: drh tags: sessions)
2014-04-26
19:23		Update requirements marks to fix typos in the requirements text. No changes to code. (check-in: f5a2636581 user: drh tags: trunk)

Changes to src/analyze.c.

Changes to src/build.c.

Changes to src/pragma.c.

Changes to src/select.c.

Changes to src/sqliteInt.h.

Changes to src/util.c.

Changes to src/where.c.

Changes to src/whereInt.h.

Changes to test/analyze3.test.

Changes to test/analyze9.test.

Changes to test/autoindex1.test.

Added test/cost.test.

Changes to test/eqp.test.

Changes to test/index6.test.

Changes to test/orderby5.test.

Changes to test/skipscan2.test.

Changes to test/unordered.test.

Changes to test/where3.test.

Changes to test/whereG.test.

Changes to tool/logest.c.

︙			︙
1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 ~~1392~~ 1393 1394 1395 1396 1397 1398 1399	list of space separated integers. Read the first nOut of these into the array aOut[]. / static void decodeIntArray( char zIntArray, /* String containing int array to decode / int nOut, / Number of slots in aOut[] / tRowcnt aOut, /* Store integers here / Index pIndex /* Handle extra flags for this index, if not NULL / ){ char z = zIntArray; int c; int i; tRowcnt v; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 if( z==0 ) z = ""; #else if( NEVER(z==0) ) z = ""; #endif for(i=0; z && i<nOut; i++){ v = 0; while( (c=z[0])>='0' && c<='9' ){ v = v10 + c - '0'; z++; } ~~aOut[i] = v;~~ if( *z==' ' ) z++; } #ifndef SQLITE_ENABLE_STAT3_OR_STAT4 assert( pIndex!=0 ); #else if( pIndex ) #endif	> > \| > > >	1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404	list of space separated integers. Read the first nOut of these into the array aOut[]. / static void decodeIntArray( char zIntArray, /* String containing int array to decode / int nOut, / Number of slots in aOut[] / tRowcnt aOut, /* Store integers here / LogEst aLog, /* Or, if aOut==0, here / Index pIndex /* Handle extra flags for this index, if not NULL / ){ char z = zIntArray; int c; int i; tRowcnt v; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 if( z==0 ) z = ""; #else if( NEVER(z==0) ) z = ""; #endif for(i=0; z && i<nOut; i++){ v = 0; while( (c=z[0])>='0' && c<='9' ){ v = v10 + c - '0'; z++; } if( aOut ){ aOut[i] = v; }else{ aLog[i] = sqlite3LogEst(v); } if( *z==' ' ) z++; } #ifndef SQLITE_ENABLE_STAT3_OR_STAT4 assert( pIndex!=0 ); #else if( pIndex ) #endif
︙			︙
1441 1442 1443 1444 1445 1446 1447 ~~1448 1449~~ 1450 1451 1452 ~~1453~~ 1454 1455 1456 1457 1458 1459 1460	pIndex = sqlite3PrimaryKeyIndex(pTable); }else{ pIndex = sqlite3FindIndex(pInfo->db, argv[1], pInfo->zDatabase); } z = argv[2]; if( pIndex ){ ~~decodeIntArray((char)z, pIndex->nKeyCol+1, pIndex->aiRowEst, pIndex); if( pIndex->pPartIdxWhere==0 ) pTable->nRowEst = pIndex->aiRowEst[0];~~ }else{ Index fakeIdx; fakeIdx.szIdxRow = pTable->szTabRow; ~~decodeIntArray((char)z, 1, &pTable->nRowEst, &fakeIdx);~~ pTable->szTabRow = fakeIdx.szIdxRow; } return 0; } /*	\| \| \|	1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465	pIndex = sqlite3PrimaryKeyIndex(pTable); }else{ pIndex = sqlite3FindIndex(pInfo->db, argv[1], pInfo->zDatabase); } z = argv[2]; if( pIndex ){ decodeIntArray((char)z, pIndex->nKeyCol+1, 0, pIndex->aiRowLogEst, pIndex); if( pIndex->pPartIdxWhere==0 ) pTable->nRowLogEst = pIndex->aiRowLogEst[0]; }else{ Index fakeIdx; fakeIdx.szIdxRow = pTable->szTabRow; decodeIntArray((char)z, 1, 0, &pTable->nRowLogEst, &fakeIdx); pTable->szTabRow = fakeIdx.szIdxRow; } return 0; } /*
︙			︙
1638 1639 1640 1641 1642 1643 1644 ~~1645 1646 1647~~ 1648 1649 1650 1651 1652 1653 1654	nCol = pIdx->nSampleCol; if( bStat3 && nCol>1 ) continue; if( pIdx!=pPrevIdx ){ initAvgEq(pPrevIdx); pPrevIdx = pIdx; } pSample = &pIdx->aSample[pIdx->nSample]; decodeIntArray((char)sqlite3_column_text(pStmt,1), ~~nCol,~~ pSample->anEq, 0); decodeIntArray((char)sqlite3_column_text(pStmt,2), ~~nCol,~~ pSample->anLt, 0); decodeIntArray((char)sqlite3_column_text(pStmt,3), ~~nCol,~~ pSample->anDLt,0); / Take a copy of the sample. Add two 0x00 bytes the end of the buffer. This is in case the sample record is corrupted. In that case, the sqlite3VdbeRecordCompare() may read up to two varints past the end of the allocated buffer before it realizes it is dealing with a corrupt record. Adding the two 0x00 bytes prevents this from causing ** a buffer overread. */	\| \| \|	1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658 1659	nCol = pIdx->nSampleCol; if( bStat3 && nCol>1 ) continue; if( pIdx!=pPrevIdx ){ initAvgEq(pPrevIdx); pPrevIdx = pIdx; } pSample = &pIdx->aSample[pIdx->nSample]; decodeIntArray((char)sqlite3_column_text(pStmt,1),nCol,pSample->anEq,0,0); decodeIntArray((char)sqlite3_column_text(pStmt,2),nCol,pSample->anLt,0,0); decodeIntArray((char)sqlite3_column_text(pStmt,3),nCol,pSample->anDLt,0,0); / Take a copy of the sample. Add two 0x00 bytes the end of the buffer. This is in case the sample record is corrupted. In that case, the sqlite3VdbeRecordCompare() may read up to two varints past the end of the allocated buffer before it realizes it is dealing with a corrupt record. Adding the two 0x00 bytes prevents this from causing ** a buffer overread. */
︙			︙

︙			︙
901 902 903 904 905 906 907 ~~908~~ 909 910 911 912 913 914 915	pParse->nErr++; goto begin_table_error; } pTable->zName = zName; pTable->iPKey = -1; pTable->pSchema = db->aDb[iDb].pSchema; pTable->nRef = 1; ~~pTable->nRowEst = 1048576;~~ assert( pParse->pNewTable==0 ); pParse->pNewTable = pTable; /* If this is the magic sqlite_sequence table used by autoincrement, then record a pointer to this table in the main database structure so that INSERT can find the table easily. */	\|	901 902 903 904 905 906 907 908 909 910 911 912 913 914 915	pParse->nErr++; goto begin_table_error; } pTable->zName = zName; pTable->iPKey = -1; pTable->pSchema = db->aDb[iDb].pSchema; pTable->nRef = 1; pTable->nRowLogEst = 200; assert( 200==sqlite3LogEst(1048576) ); assert( pParse->pNewTable==0 ); pParse->pNewTable = pTable; /* If this is the magic sqlite_sequence table used by autoincrement, then record a pointer to this table in the main database structure so that INSERT can find the table easily. */
︙			︙
2726 2727 2728 2729 2730 2731 2732 ~~2733~~ 2734 2735 2736 2737 2738 ~~2739 2740 2741~~ 2742 2743 2744 2745 2746 2747 2748	char *ppExtra / Pointer to the "extra" space / ){ Index p; /* Allocated index object / int nByte; / Bytes of space for Index object + arrays / nByte = ROUND8(sizeof(Index)) + / Index structure / ROUND8(sizeof(char)nCol) + / Index.azColl / ~~ROUND8(sizeof(~~tRowcn~~t)(nCol+1) + /* Index.aiRowEst /~~ sizeof(i16)nCol + /* Index.aiColumn / sizeof(u8)nCol); /* Index.aSortOrder / p = sqlite3DbMallocZero(db, nByte + nExtra); if( p ){ char pExtra = ((char)p)+ROUND8(sizeof(Index)); p->azColl = (char)pExtra; pExtra += ROUND8(sizeof(char)nCol); p->aiRowEst = (~~tRowcn~~t)pExtra; pExtra += sizeof(~~tRowcn~~t)(nCol+1); p->aiColumn = (i16)pExtra; pExtra += sizeof(i16)nCol; p->aSortOrder = (u8)pExtra; p->nColumn = nCol; p->nKeyCol = nCol - 1; ppExtra = ((char)p) + nByte; } return p; }	\| \| \| \|	2726 2727 2728 2729 2730 2731 2732 2733 2734 2735 2736 2737 2738 2739 2740 2741 2742 2743 2744 2745 2746 2747 2748	char *ppExtra / Pointer to the "extra" space / ){ Index p; /* Allocated index object / int nByte; / Bytes of space for Index object + arrays / nByte = ROUND8(sizeof(Index)) + / Index structure / ROUND8(sizeof(char)nCol) + / Index.azColl / ROUND8(sizeof(LogEst)(nCol+1) + /* Index.aiRowLogEst / sizeof(i16)nCol + /* Index.aiColumn / sizeof(u8)nCol); /* Index.aSortOrder / p = sqlite3DbMallocZero(db, nByte + nExtra); if( p ){ char pExtra = ((char)p)+ROUND8(sizeof(Index)); p->azColl = (char)pExtra; pExtra += ROUND8(sizeof(char)nCol); p->aiRowLogEst = (LogEst)pExtra; pExtra += sizeof(LogEst)(nCol+1); p->aiColumn = (i16)pExtra; pExtra += sizeof(i16)nCol; p->aSortOrder = (u8)pExtra; p->nColumn = nCol; p->nKeyCol = nCol - 1; ppExtra = ((char)p) + nByte; } return p; }
︙			︙
2964 2965 2966 2967 2968 2969 2970 ~~2971~~ 2972 2973 2974 2975 2976 2977 2978	nName = sqlite3Strlen30(zName); nExtraCol = pPk ? pPk->nKeyCol : 1; pIndex = sqlite3AllocateIndexObject(db, pList->nExpr + nExtraCol, nName + nExtra + 1, &zExtra); if( db->mallocFailed ){ goto exit_create_index; } ~~assert( EIGHT_BYTE_ALIGNMENT(pIndex->aiRowEst) );~~ assert( EIGHT_BYTE_ALIGNMENT(pIndex->azColl) ); pIndex->zName = zExtra; zExtra += nName + 1; memcpy(pIndex->zName, zName, nName+1); pIndex->pTable = pTab; pIndex->onError = (u8)onError; pIndex->uniqNotNull = onError!=OE_None;	\|	2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978	nName = sqlite3Strlen30(zName); nExtraCol = pPk ? pPk->nKeyCol : 1; pIndex = sqlite3AllocateIndexObject(db, pList->nExpr + nExtraCol, nName + nExtra + 1, &zExtra); if( db->mallocFailed ){ goto exit_create_index; } assert( EIGHT_BYTE_ALIGNMENT(pIndex->aiRowLogEst) ); assert( EIGHT_BYTE_ALIGNMENT(pIndex->azColl) ); pIndex->zName = zExtra; zExtra += nName + 1; memcpy(pIndex->zName, zName, nName+1); pIndex->pTable = pTab; pIndex->onError = (u8)onError; pIndex->uniqNotNull = onError!=OE_None;
︙			︙
3245 3246 3247 3248 3249 3250 3251 ~~3252~~ 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 ~~3263~~ 3264 ~~3265 3266~~ ~~3267 3268 3269~~ ~~3270 3271 3272~~ 3273 ~~3274 3275 3276~~ 3277 3278 3279 3280 3281 3282 3283	Fill the Index.aiRowEst[] array with default information - information to be used when we have not run the ANALYZE command. aiRowEst[0] is suppose to contain the number of elements in the index. Since we do not know, guess 1 million. aiRowEst[1] is an estimate of the number of rows in the table that match any particular value of the first column of the index. aiRowEst[2] is an estimate of the number of rows that match any particular combiniation of the first 2 columns ** of the index. And so forth. It must always be the case that * aiRowEst[N]<=aiRowEst[N-1] aiRowEst[N]>=1 Apart from that, we have little to go on besides intuition as to how aiRowEst[] should be initialized. The numbers generated here are based on typical values found in actual indices. / void sqlite3DefaultRowEst(Index pIdx){ ~~~~tRowcn~~t a = pIdx->aiRowEst;~~ int i; ~~tRowcnt n;~~ ~~assert( a!=0 );~~ ~~a[0] = pIdx->pTable->nRowEst; if( a[0]<10 ) a[0] = 10; ~~n = 10;~~~~ ~~for(i=1; i<=pIdx->nKeyCol; i++){ a[i] = n; ~~if( n>5 ) n--;~~~~ } ~~~~if( pIdx->onError!=OE_None ){~~ ~~a[pIdx->nKeyCol] = 1;~~ }~~ } / This routine will drop an existing named index. This routine implements the DROP INDEX statement. / void sqlite3DropIndex(Parse pParse, SrcList *pName, int ifExists){	\| > > \| > \| < > > > \| \| \| > > > \| \| < < < \| > >	3245 3246 3247 3248 3249 3250 3251 3252 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 3263 3264 3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284 3285 3286 3287 3288 3289 3290	Fill the Index.aiRowEst[] array with default information - information to be used when we have not run the ANALYZE command. aiRowEst[0] is suppose to contain the number of elements in the index. Since we do not know, guess 1 million. 
aiRowEst[1] is an estimate of the number of rows in the table that match any particular value of the first column of the index. aiRowEst[2] is an estimate of the number of rows that match any particular combination of the first 2 columns ** of the index. And so forth. It must always be the case that * aiRowEst[N]<=aiRowEst[N-1] aiRowEst[N]>=1 Apart from that, we have little to go on besides intuition as to how aiRowEst[] should be initialized. The numbers generated here are based on typical values found in actual indices. / void sqlite3DefaultRowEst(Index pIdx){ /* 10, 9, 8, 7, 6 / LogEst aVal[] = { 33, 32, 30, 28, 26 }; LogEst a = pIdx->aiRowLogEst; int nCopy = MIN(ArraySize(aVal), pIdx->nKeyCol); int i; /* Set the first entry (number of rows in the index) to the estimated number of rows in the table. Or 10, if the estimated number of rows in the table is less than that. / a[0] = pIdx->pTable->nRowLogEst; if( a[0]<33 ) a[0] = 33; assert( 33==sqlite3LogEst(10) ); / Estimate that a[1] is 10, a[2] is 9, a[3] is 8, a[4] is 7, a[5] is ** 6 and each subsequent value (if any) is 5. / memcpy(&a[1], aVal, nCopysizeof(LogEst)); for(i=nCopy+1; i<=pIdx->nKeyCol; i++){ a[i] = 23; assert( 23==sqlite3LogEst(5) ); } assert( 0==sqlite3LogEst(1) ); if( pIdx->onError!=OE_None ) a[pIdx->nKeyCol] = 0; } /* This routine will drop an existing named index. This routine implements the DROP INDEX statement. / void sqlite3DropIndex(Parse pParse, SrcList *pName, int ifExists){
︙			︙

︙			︙
1686 1687 1688 1689 1690 1691 1692 ~~1693~~ 1694 1695 1696 1697 1698 1699 1700	return 0; } /* The sqlite3ResultSetOfSelect() is only used n contexts where lookaside ** is disabled */ assert( db->lookaside.bEnabled==0 ); pTab->nRef = 1; pTab->zName = 0; ~~pTab->nRowEst = 1048576;~~ selectColumnsFromExprList(pParse, pSelect->pEList, &pTab->nCol, &pTab->aCol); selectAddColumnTypeAndCollation(pParse, pTab, pSelect); pTab->iPKey = -1; if( db->mallocFailed ){ sqlite3DeleteTable(db, pTab); return 0; }	\|	1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700	return 0; } /* The sqlite3ResultSetOfSelect() is only used n contexts where lookaside ** is disabled */ assert( db->lookaside.bEnabled==0 ); pTab->nRef = 1; pTab->zName = 0; pTab->nRowLogEst = 200; assert( 200==sqlite3LogEst(1048576) ); selectColumnsFromExprList(pParse, pSelect->pEList, &pTab->nCol, &pTab->aCol); selectAddColumnTypeAndCollation(pParse, pTab, pSelect); pTab->iPKey = -1; if( db->mallocFailed ){ sqlite3DeleteTable(db, pTab); return 0; }
︙			︙
3825 3826 3827 3828 3829 3830 3831 ~~3832~~ 3833 3834 3835 3836 3837 3838 3839	assert( pFrom->pTab==0 ); pFrom->pTab = pTab = sqlite3DbMallocZero(db, sizeof(Table)); if( pTab==0 ) return WRC_Abort; pTab->nRef = 1; pTab->zName = sqlite3DbStrDup(db, pCte->zName); pTab->iPKey = -1; ~~pTab->nRowEst = 1048576;~~ pTab->tabFlags \|= TF_Ephemeral; pFrom->pSelect = sqlite3SelectDup(db, pCte->pSelect, 0); if( db->mallocFailed ) return SQLITE_NOMEM; assert( pFrom->pSelect ); /* Check if this is a recursive CTE. */ pSel = pFrom->pSelect;	\|	3825 3826 3827 3828 3829 3830 3831 3832 3833 3834 3835 3836 3837 3838 3839	assert( pFrom->pTab==0 ); pFrom->pTab = pTab = sqlite3DbMallocZero(db, sizeof(Table)); if( pTab==0 ) return WRC_Abort; pTab->nRef = 1; pTab->zName = sqlite3DbStrDup(db, pCte->zName); pTab->iPKey = -1; pTab->nRowLogEst = 200; assert( 200==sqlite3LogEst(1048576) ); pTab->tabFlags \|= TF_Ephemeral; pFrom->pSelect = sqlite3SelectDup(db, pCte->pSelect, 0); if( db->mallocFailed ) return SQLITE_NOMEM; assert( pFrom->pSelect ); /* Check if this is a recursive CTE. */ pSel = pFrom->pSelect;
︙			︙
4001 4002 4003 4004 4005 4006 4007 ~~4008~~ 4009 4010 4011 4012 4013 4014 4015	pFrom->pTab = pTab = sqlite3DbMallocZero(db, sizeof(Table)); if( pTab==0 ) return WRC_Abort; pTab->nRef = 1; pTab->zName = sqlite3MPrintf(db, "sqlite_sq_%p", (void)pTab); while( pSel->pPrior ){ pSel = pSel->pPrior; } selectColumnsFromExprList(pParse, pSel->pEList, &pTab->nCol, &pTab->aCol); pTab->iPKey = -1; ~~pTab->nRowEst = 1048576;~~ pTab->tabFlags \|= TF_Ephemeral; #endif }else{ / An ordinary table or view name in the FROM clause */ assert( pFrom->pTab==0 ); pFrom->pTab = pTab = sqlite3LocateTableItem(pParse, 0, pFrom); if( pTab==0 ) return WRC_Abort;	\|	4001 4002 4003 4004 4005 4006 4007 4008 4009 4010 4011 4012 4013 4014 4015	pFrom->pTab = pTab = sqlite3DbMallocZero(db, sizeof(Table)); if( pTab==0 ) return WRC_Abort; pTab->nRef = 1; pTab->zName = sqlite3MPrintf(db, "sqlite_sq_%p", (void)pTab); while( pSel->pPrior ){ pSel = pSel->pPrior; } selectColumnsFromExprList(pParse, pSel->pEList, &pTab->nCol, &pTab->aCol); pTab->iPKey = -1; pTab->nRowLogEst = 200; assert( 200==sqlite3LogEst(1048576) ); pTab->tabFlags \|= TF_Ephemeral; #endif }else{ / An ordinary table or view name in the FROM clause */ assert( pFrom->pTab==0 ); pFrom->pTab = pTab = sqlite3LocateTableItem(pParse, 0, pFrom); if( pTab==0 ) return WRC_Abort;
︙			︙
4651 4652 4653 4654 4655 4656 4657 ~~4658~~ 4659 4660 4661 4662 4663 4664 4665	pItem->regReturn = ++pParse->nMem; sqlite3VdbeAddOp3(v, OP_InitCoroutine, pItem->regReturn, 0, addrTop); VdbeComment((v, "%s", pItem->pTab->zName)); pItem->addrFillSub = addrTop; sqlite3SelectDestInit(&dest, SRT_Coroutine, pItem->regReturn); explainSetInteger(pItem->iSelectId, (u8)pParse->iNextSelectId); sqlite3Select(pParse, pSub, &dest); ~~pItem->pTab->nRowEst = (~~unsigned)~~pSub->nSelectRow;~~ pItem->viaCoroutine = 1; pItem->regResult = dest.iSdst; sqlite3VdbeAddOp1(v, OP_EndCoroutine, pItem->regReturn); sqlite3VdbeJumpHere(v, addrTop-1); sqlite3ClearTempRegCache(pParse); }else{ /* Generate a subroutine that will fill an ephemeral table with	\|	4651 4652 4653 4654 4655 4656 4657 4658 4659 4660 4661 4662 4663 4664 4665	pItem->regReturn = ++pParse->nMem; sqlite3VdbeAddOp3(v, OP_InitCoroutine, pItem->regReturn, 0, addrTop); VdbeComment((v, "%s", pItem->pTab->zName)); pItem->addrFillSub = addrTop; sqlite3SelectDestInit(&dest, SRT_Coroutine, pItem->regReturn); explainSetInteger(pItem->iSelectId, (u8)pParse->iNextSelectId); sqlite3Select(pParse, pSub, &dest); pItem->pTab->nRowLogEst = sqlite3LogEst(pSub->nSelectRow); pItem->viaCoroutine = 1; pItem->regResult = dest.iSdst; sqlite3VdbeAddOp1(v, OP_EndCoroutine, pItem->regReturn); sqlite3VdbeJumpHere(v, addrTop-1); sqlite3ClearTempRegCache(pParse); }else{ /* Generate a subroutine that will fill an ephemeral table with
︙			︙
4682 4683 4684 4685 4686 4687 4688 ~~4689~~ 4690 4691 4692 4693 4694 4695 4696	VdbeComment((v, "materialize \"%s\"", pItem->pTab->zName)); }else{ VdbeNoopComment((v, "materialize \"%s\"", pItem->pTab->zName)); } sqlite3SelectDestInit(&dest, SRT_EphemTab, pItem->iCursor); explainSetInteger(pItem->iSelectId, (u8)pParse->iNextSelectId); sqlite3Select(pParse, pSub, &dest); ~~pItem->pTab->nRowEst = (~~unsigned)~~pSub->nSelectRow;~~ if( onceAddr ) sqlite3VdbeJumpHere(v, onceAddr); retAddr = sqlite3VdbeAddOp1(v, OP_Return, pItem->regReturn); VdbeComment((v, "end %s", pItem->pTab->zName)); sqlite3VdbeChangeP1(v, topAddr, retAddr); sqlite3ClearTempRegCache(pParse); } if( /pParse->nErr \|\|/ db->mallocFailed ){	\|	4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692 4693 4694 4695 4696	VdbeComment((v, "materialize \"%s\"", pItem->pTab->zName)); }else{ VdbeNoopComment((v, "materialize \"%s\"", pItem->pTab->zName)); } sqlite3SelectDestInit(&dest, SRT_EphemTab, pItem->iCursor); explainSetInteger(pItem->iSelectId, (u8)pParse->iNextSelectId); sqlite3Select(pParse, pSub, &dest); pItem->pTab->nRowLogEst = sqlite3LogEst(pSub->nSelectRow); if( onceAddr ) sqlite3VdbeJumpHere(v, onceAddr); retAddr = sqlite3VdbeAddOp1(v, OP_Return, pItem->regReturn); VdbeComment((v, "end %s", pItem->pTab->zName)); sqlite3VdbeChangeP1(v, topAddr, retAddr); sqlite3ClearTempRegCache(pParse); } if( /pParse->nErr \|\|/ db->mallocFailed ){
︙			︙

︙			︙
521 522 523 524 525 526 527 ~~528~~ 529 530 ~~531~~ 532 533 534 535 536 537 538	/* Estimated quantities used for query planning are stored as 16-bit logarithms. For quantity X, the value stored is 10*log2(X). This gives a possible range of values of approximately 1.0e986 to 1e-986. But the allowed values are "grainy". Not every value is representable. For example, quantities 16 and 17 are both represented by a LogEst of 40. However, since LogEst quantatites are suppose to be estimates, not exact values, this imprecision is not a problem. "LogEst" is short for "Logarithimic Estimate". Examples: 1 -> 0 20 -> 43 10000 -> 132 2 -> 10 25 -> 46 25000 -> 146 3 -> 16 100 -> 66 1000000 -> 199 4 -> 20 1000 -> 99 1048576 -> 200 10 -> 33 1024 -> 100 4294967296 -> 320	\| \|	521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538	/* Estimated quantities used for query planning are stored as 16-bit logarithms. For quantity X, the value stored is 10*log2(X). This gives a possible range of values of approximately 1.0e986 to 1e-986. But the allowed values are "grainy". Not every value is representable. For example, quantities 16 and 17 are both represented by a LogEst of 40. However, since LogEst quantaties are suppose to be estimates, not exact values, this imprecision is not a problem. "LogEst" is short for "Logarithmic Estimate". Examples: 1 -> 0 20 -> 43 10000 -> 132 2 -> 10 25 -> 46 25000 -> 146 3 -> 16 100 -> 66 1000000 -> 199 4 -> 20 1000 -> 99 1048576 -> 200 10 -> 33 1024 -> 100 4294967296 -> 320
︙			︙
1467 1468 1469 1470 1471 1472 1473 ~~1474~~ 1475 1476 1477 1478 1479 1480 1481	Index pIndex; / List of SQL indexes on this table. / Select pSelect; /* NULL for tables. Points to definition if a view. / FKey pFKey; /* Linked list of all foreign keys in this table / char zColAff; /* String defining the affinity of each column / #ifndef SQLITE_OMIT_CHECK ExprList pCheck; /* All CHECK constraints / #endif ~~~~tRowcn~~t nRowEst; / Estimated rows in table - from sqlite_stat1 table /~~ int tnum; / Root BTree node for this table (see note above) / i16 iPKey; / If not negative, use aCol[iPKey] as the primary key / i16 nCol; / Number of columns in this table / u16 nRef; / Number of pointers to this Table / LogEst szTabRow; / Estimated size of each table row in bytes / u8 tabFlags; / Mask of TF_* values / u8 keyConf; / What to do in case of uniqueness conflict on iPKey */	\|	1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481	Index pIndex; / List of SQL indexes on this table. / Select pSelect; /* NULL for tables. Points to definition if a view. / FKey pFKey; /* Linked list of all foreign keys in this table / char zColAff; /* String defining the affinity of each column / #ifndef SQLITE_OMIT_CHECK ExprList pCheck; /* All CHECK constraints / #endif LogEst nRowLogEst; / Estimated rows in table - from sqlite_stat1 table / int tnum; / Root BTree node for this table (see note above) / i16 iPKey; / If not negative, use aCol[iPKey] as the primary key / i16 nCol; / Number of columns in this table / u16 nRef; / Number of pointers to this Table / LogEst szTabRow; / Estimated size of each table row in bytes / u8 tabFlags; / Mask of TF_* values / u8 keyConf; / What to do in case of uniqueness conflict on iPKey */
︙			︙
1676 1677 1678 1679 1680 1681 1682 ~~1683~~ 1684 1685 1686 1687 1688 1689 1690	and the value of Index.onError indicate the which conflict resolution algorithm to employ whenever an attempt is made to insert a non-unique ** element. / struct Index { char zName; /* Name of this index / i16 aiColumn; /* Which columns are used by this index. 1st is 0 / ~~~~tRowcn~~t aiRowEst; /* From ANALYZE: Est. rows selected by each column /~~ Table pTable; /* The SQL table being indexed / char zColAff; /* String defining the affinity of each column / Index pNext; /* The next index associated with the same table / Schema pSchema; /* Schema containing this index / u8 aSortOrder; /* for each column: True==DESC, False==ASC / char azColl; / Array of collation sequence names for index / Expr pPartIdxWhere; /* WHERE clause for partial indices */	\|	1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690	and the value of Index.onError indicate the which conflict resolution algorithm to employ whenever an attempt is made to insert a non-unique ** element. / struct Index { char zName; /* Name of this index / i16 aiColumn; /* Which columns are used by this index. 1st is 0 / LogEst aiRowLogEst; /* From ANALYZE: Est. rows selected by each column / Table pTable; /* The SQL table being indexed / char zColAff; /* String defining the affinity of each column / Index pNext; /* The next index associated with the same table / Schema pSchema; /* Schema containing this index / u8 aSortOrder; /* for each column: True==DESC, False==ASC / char azColl; / Array of collation sequence names for index / Expr pPartIdxWhere; /* WHERE clause for partial indices */
︙			︙

︙			︙
223 224 225 226 227 228 229 ~~230~~ 231 232 233 234 235 236 237	} pWC->nSlot = sqlite3DbMallocSize(db, pWC->a)/sizeof(pWC->a[0]); } pTerm = &pWC->a[idx = pWC->nTerm++]; if( p && ExprHasProperty(p, EP_Unlikely) ){ pTerm->truthProb = sqlite3LogEst(p->iTable) - 99; }else{ ~~pTerm->truthProb = -1;~~ } pTerm->pExpr = sqlite3ExprSkipCollate(p); pTerm->wtFlags = wtFlags; pTerm->pWC = pWC; pTerm->iParent = -1; return idx; }	\|	223 224 225 226 227 228 229 230 231 232 233 234 235 236 237	} pWC->nSlot = sqlite3DbMallocSize(db, pWC->a)/sizeof(pWC->a[0]); } pTerm = &pWC->a[idx = pWC->nTerm++]; if( p && ExprHasProperty(p, EP_Unlikely) ){ pTerm->truthProb = sqlite3LogEst(p->iTable) - 99; }else{ pTerm->truthProb = 1; } pTerm->pExpr = sqlite3ExprSkipCollate(p); pTerm->wtFlags = wtFlags; pTerm->pWC = pWC; pTerm->iParent = -1; return idx; }
︙			︙
1952 1953 1954 1955 1956 1957 1958 ~~1959~~ 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983	aStat[1] = aSample[i].anEq[iCol]; }else{ tRowcnt iLower, iUpper, iGap; if( i==0 ){ iLower = 0; iUpper = aSample[0].anLt[iCol]; }else{ ~~iUpper = i>=pIdx->nSample ? ~~pIdx->aiRowEst[0]~~ : aSample[i].anLt[iCol];~~ iLower = aSample[i-1].anEq[iCol] + aSample[i-1].anLt[iCol]; } aStat[1] = (pIdx->nKeyCol>iCol ? pIdx->aAvgEq[iCol] : 1); if( iLower>=iUpper ){ iGap = 0; }else{ iGap = iUpper - iLower; } if( roundUp ){ iGap = (iGap2)/3; }else{ iGap = iGap/3; } aStat[0] = iLower + iGap; } } #endif / SQLITE_ENABLE_STAT3_OR_STAT4 / / This function is used to estimate the number of rows that will be visited by scanning an index for a range of values. The range may have an upper bound, a lower bound, or both. The WHERE clause terms that set the upper and lower bounds are represented by pLower and pUpper respectively. For ** example, assuming that index p is on t1(a):	> \| > > > > > > > > > > > > > > > > > > > > > > >	1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969 1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007	aStat[1] = aSample[i].anEq[iCol]; }else{ tRowcnt iLower, iUpper, iGap; if( i==0 ){ iLower = 0; iUpper = aSample[0].anLt[iCol]; }else{ i64 nRow0 = sqlite3LogEstToInt(pIdx->aiRowLogEst[0]); iUpper = i>=pIdx->nSample ? nRow0 : aSample[i].anLt[iCol]; iLower = aSample[i-1].anEq[iCol] + aSample[i-1].anLt[iCol]; } aStat[1] = (pIdx->nKeyCol>iCol ? 
pIdx->aAvgEq[iCol] : 1); if( iLower>=iUpper ){ iGap = 0; }else{ iGap = iUpper - iLower; } if( roundUp ){ iGap = (iGap2)/3; }else{ iGap = iGap/3; } aStat[0] = iLower + iGap; } } #endif / SQLITE_ENABLE_STAT3_OR_STAT4 / / If it is not NULL, pTerm is a term that provides an upper or lower bound on a range scan. Without considering pTerm, it is estimated that the scan will visit nNew rows. This function returns the number estimated to be visited after taking pTerm into account. If the user explicitly specified a likelihood() value for this term, then the return value is the likelihood multiplied by the number of input rows. Otherwise, this function assumes that an "IS NOT NULL" term ** has a likelihood of 0.50, and any other term a likelihood of 0.25. / static LogEst whereRangeAdjust(WhereTerm pTerm, LogEst nNew){ LogEst nRet = nNew; if( pTerm ){ if( pTerm->truthProb<=0 ){ nRet += pTerm->truthProb; }else if( (pTerm->wtFlags & TERM_VNULL)==0 ){ nRet -= 20; assert( 20==sqlite3LogEst(4) ); } } return nRet; } /* This function is used to estimate the number of rows that will be visited by scanning an index for a range of values. The range may have an upper bound, a lower bound, or both. The WHERE clause terms that set the upper and lower bounds are represented by pLower and pUpper respectively. For ** example, assuming that index p is on t1(a):
︙			︙
2063 2064 2065 2066 2067 2068 2069 ~~2070~~ 2071 2072 2073 2074 2075 2076 2077	aff = SQLITE_AFF_INTEGER; }else{ aff = p->pTable->aCol[p->aiColumn[nEq]].affinity; } /* Determine iLower and iUpper using ($P) only. / if( nEq==0 ){ iLower = 0; ~~iUpper = p->aiRowEst[0];~~ }else{ / Note: this call could be optimized away - since the same values must ** have been requested when testing key $P in whereEqualScanEst(). */ whereKeyStats(pParse, p, pRec, 0, a); iLower = a[0]; iUpper = a[0] + a[1]; }	\|	2087 2088 2089 2090 2091 2092 2093 2094 2095 2096 2097 2098 2099 2100 2101	aff = SQLITE_AFF_INTEGER; }else{ aff = p->pTable->aCol[p->aiColumn[nEq]].affinity; } /* Determine iLower and iUpper using ($P) only. / if( nEq==0 ){ iLower = 0; iUpper = sqlite3LogEstToInt(p->aiRowLogEst[0]); }else{ / Note: this call could be optimized away - since the same values must ** have been requested when testing key $P in whereEqualScanEst(). */ whereKeyStats(pParse, p, pRec, 0, a); iLower = a[0]; iUpper = a[0] + a[1]; }
︙			︙
2123 2124 2125 2126 2127 2128 2129 ~~2130 2131 2132 2133 2134 2135~~ ~~2136 2137~~ ~~2138 2139 2140~~ 2141 2142 2143 2144 2145 2146 2147	} } #else UNUSED_PARAMETER(pParse); UNUSED_PARAMETER(pBuilder); #endif assert( pLower \|\| pUpper ); ~~/* TUNING: Each inequality constraint reduces the search space 4-fold.~~ ** A BETWEEN operator, therefore, reduces the search space 16-fold */ ~~nNew = nOut;~~ if( p~~Low~~er && (p~~Low~~er->wtFlags & TERM_VNULL)==0 ){ ~~nNew -= 20; assert( 20==sqlite3LogEst(4) );~~ nOut--; ~~} i~~f( pU~~pper ){~~ ~~nNew -= 20~~; assert( 20==sqlite3LogEst(4) )~~; ~~nOut--;~~ }~~ if( nNew<10 ) nNew = 10; if( nNew<nOut ) nOut = nNew; pLoop->nOut = (LogEst)nOut; return rc; } #ifdef SQLITE_ENABLE_STAT3_OR_STAT4	< < < \| < \| > \| \| > > > > \| < \| >	2147 2148 2149 2150 2151 2152 2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163 2164 2165 2166 2167 2168 2169 2170 2171 2172	} } #else UNUSED_PARAMETER(pParse); UNUSED_PARAMETER(pBuilder); #endif assert( pLower \|\| pUpper ); assert( pUpper==0 \|\| (pUpper->wtFlags & TERM_VNULL)==0 ); nNew = whereRangeAdjust(pLower, nOut); nNew = whereRangeAdjust(pUpper, nNew); /* TUNING: If there is both an upper and lower limit, assume the range is reduced by an additional 75%. This means that, by default, an open-ended range query (e.g. col > ?) is assumed to match 1/4 of the rows in the index. While a closed range (e.g. col BETWEEN ? AND ?) is estimated to match 1/64 of the index. */ if( pLower && pUpper ) nNew -= 20; nOut -= (pLower!=0) + (pUpper!=0); if( nNew<10 ) nNew = 10; if( nNew<nOut ) nOut = nNew; pLoop->nOut = (LogEst)nOut; return rc; } #ifdef SQLITE_ENABLE_STAT3_OR_STAT4
︙			︙
2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 ~~2245~~ 2246 2247 2248 2249 2250 2251 ~~2252~~ 2253 2254 2255 2256 2257 2258 2259	static int whereInScanEst( Parse pParse, / Parsing & code generating context / WhereLoopBuilder pBuilder, ExprList pList, / The value list on the RHS of "x IN (v1,v2,v3,...)" / tRowcnt pnRow /* Write the revised row estimate here / ){ Index p = pBuilder->pNew->u.btree.pIndex; int nRecValid = pBuilder->nRecValid; int rc = SQLITE_OK; /* Subfunction return code / tRowcnt nEst; / Number of rows for a single term / tRowcnt nRowEst = 0; / New estimate of the number of rows / int i; / Loop counter / assert( p->aSample!=0 ); for(i=0; rc==SQLITE_OK && i<pList->nExpr; i++){ ~~nEst = ~~p->aiRowEst[0]~~;~~ rc = whereEqualScanEst(pParse, pBuilder, pList->a[i].pExpr, &nEst); nRowEst += nEst; pBuilder->nRecValid = nRecValid; } if( rc==SQLITE_OK ){ ~~if( nRowEst > ~~p->aiRowEst[0]~~ ) nRowEst = ~~p->aiRowEst[0]~~;~~ pnRow = nRowEst; WHERETRACE(0x10,("IN row estimate: est=%g\n", nRowEst)); } assert( pBuilder->nRecValid==nRecValid ); return rc; } #endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */	> \| \|	2255 2256 2257 2258 2259 2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273 2274 2275 2276 2277 2278 2279 2280 2281 2282 2283 2284 2285	static int whereInScanEst( Parse pParse, / Parsing & code generating context / WhereLoopBuilder pBuilder, ExprList pList, / The value list on the RHS of "x IN (v1,v2,v3,...)" / tRowcnt pnRow /* Write the revised row estimate here / ){ Index p = pBuilder->pNew->u.btree.pIndex; i64 nRow0 = sqlite3LogEstToInt(p->aiRowLogEst[0]); int nRecValid = pBuilder->nRecValid; int rc = SQLITE_OK; /* Subfunction return code / tRowcnt nEst; / Number of rows for a single term / tRowcnt nRowEst = 0; / New estimate of the number of rows / int i; / Loop counter / assert( p->aSample!=0 ); for(i=0; rc==SQLITE_OK && i<pList->nExpr; i++){ nEst = nRow0; rc = whereEqualScanEst(pParse, pBuilder, 
pList->a[i].pExpr, &nEst); nRowEst += nEst; pBuilder->nRecValid = nRecValid; } if( rc==SQLITE_OK ){ if( nRowEst > nRow0 ) nRowEst = nRow0; pnRow = nRowEst; WHERETRACE(0x10,("IN row estimate: est=%g\n", nRowEst)); } assert( pBuilder->nRecValid==nRecValid ); return rc; } #endif /* SQLITE_ENABLE_STAT3_OR_STAT4 */
︙			︙
3756 3757 3758 3759 3760 3761 3762 3763 3764 3765 3766 3767 3768 3769 3770 3771 3772	To say "WhereLoop X is a proper subset of Y" means that X uses fewer WHERE clause terms than Y and that every WHERE clause term used by X is also used by Y. / static void whereLoopAdjustCost(const WhereLoop p, WhereLoop pTemplate){ if( (pTemplate->wsFlags & WHERE_INDEXED)==0 ) return; for(; p; p=p->pNextLoop){ if( p->iTab!=pTemplate->iTab ) continue; if( (p->wsFlags & WHERE_INDEXED)==0 ) continue; if( whereLoopCheaperProperSubset(p, pTemplate) ){ / Adjust pTemplate cost downward so that it is cheaper than its ** subset p / pTemplate->rRun = p->rRun; pTemplate->nOut = p->nOut - 1; }else if( whereLoopCheaperProperSubset(pTemplate, p) ){ / Adjust pTemplate cost upward so that it is costlier than p since	> >	3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800	To say "WhereLoop X is a proper subset of Y" means that X uses fewer WHERE clause terms than Y and that every WHERE clause term used by X is also used by Y. / static void whereLoopAdjustCost(const WhereLoop p, WhereLoop pTemplate){ if( (pTemplate->wsFlags & WHERE_INDEXED)==0 ) return; if( (pTemplate->wsFlags & WHERE_SKIPSCAN)!=0 ) return; for(; p; p=p->pNextLoop){ if( p->iTab!=pTemplate->iTab ) continue; if( (p->wsFlags & WHERE_INDEXED)==0 ) continue; if( (p->wsFlags & WHERE_SKIPSCAN)!=0 ) continue; if( whereLoopCheaperProperSubset(p, pTemplate) ){ / Adjust pTemplate cost downward so that it is cheaper than its ** subset p / pTemplate->rRun = p->rRun; pTemplate->nOut = p->nOut - 1; }else if( whereLoopCheaperProperSubset(pTemplate, p) ){ / Adjust pTemplate cost upward so that it is costlier than p since
︙			︙
3983 3984 3985 3986 3987 3988 3989 ~~3990~~ 3991 3992 3993 3994 ~~3995 3996~~ 3997 3998 3999 4000 4001 4002 4003	if( (pTerm->prereqAll & notAllowed)!=0 ) continue; for(j=pLoop->nLTerm-1; j>=0; j--){ pX = pLoop->aLTerm[j]; if( pX==0 ) continue; if( pX==pTerm ) break; if( pX->iParent>=0 && (&pWC->a[pX->iParent])==pTerm ) break; } ~~if( j<0 ) ~~pLoop->nOut += pTerm->truthProb;~~~~ } } /* We have so far matched pBuilder->pNew->u.btree.nEq terms of the ~~index pIndex.~~ Try to match one more. If pProbe->tnum==0, that means pIndex is a fake index used for the ** INTEGER PRIMARY KEY. / static int whereLoopAddBtreeIndex( WhereLoopBuilder pBuilder, /* The WhereLoop factory / struct SrcList_item pSrc, /* FROM clause term being analyzed */	\| > > \| \| > > > > >	4011 4012 4013 4014 4015 4016 4017 4018 4019 4020 4021 4022 4023 4024 4025 4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036 4037 4038	if( (pTerm->prereqAll & notAllowed)!=0 ) continue; for(j=pLoop->nLTerm-1; j>=0; j--){ pX = pLoop->aLTerm[j]; if( pX==0 ) continue; if( pX==pTerm ) break; if( pX->iParent>=0 && (&pWC->a[pX->iParent])==pTerm ) break; } if( j<0 ){ pLoop->nOut += (pTerm->truthProb<=0 ? pTerm->truthProb : -1); } } } /* We have so far matched pBuilder->pNew->u.btree.nEq terms of the index pIndex. Try to match one more. When this function is called, pBuilder->pNew->nOut contains the number of rows expected to be visited by filtering using the nEq terms only. If it is modified, this value is restored before this function returns. If pProbe->tnum==0, that means pIndex is a fake index used for the INTEGER PRIMARY KEY. / static int whereLoopAddBtreeIndex( WhereLoopBuilder pBuilder, /* The WhereLoop factory / struct SrcList_item pSrc, /* FROM clause term being analyzed */
︙			︙
4015 4016 4017 4018 4019 4020 4021 ~~4022~~ 4023 4024 4025 4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036 4037 4038 4039 4040 4041 4042 ~~4043 4044~~ 4045 4046 ~~4047~~ 4048 4049 4050 4051 4052 4053 4054 4055 4056 4057 ~~4058~~ 4059 4060 4061 ~~4062 4063 4064 4065~~ 4066 4067 4068 ~~4069~~ 4070 4071 4072 4073 4074 4075 4076 ~~4077 4078 4079 4080~~ 4081 4082 4083 4084 4085 4086 4087 ~~4088~~ 4089 4090 4091 4092 4093 4094 ~~4095 4096~~ 4097 4098 4099 4100 4101 4102 ~~4103~~ ~~4104~~ 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115 ~~4116 4117 4118 4119 4120 4121 4122 4123~~ 4124 ~~4125 4126~~ 4127 4128 4129 4130 4131 4132 ~~4133 4134 4135~~ 4136 ~~4137 4138 4139 4140 4141 4142 4143~~ 4144 4145 4146 4147 ~~4148 4149 4150~~ 4151 4152 4153 4154 4155 ~~4156~~ ~~4157~~ ~~4158~~ 4159 ~~4160~~ 4161 ~~4162 4163 4164 4165~~ ~~4166 4167 4168 4169 4170 4171 4172 4173 4174 4175 4176 4177~~ ~~4178 4179 4180~~ ~~4181 4182~~ 4183 4184 ~~4185 4186 4187~~ 4188 ~~4189~~ ~~4190~~ 4191 4192 4193 4194 4195 4196 4197 4198 4199	u16 saved_nLTerm; /* Original value of pNew->nLTerm / u16 saved_nEq; / Original value of pNew->u.btree.nEq / u16 saved_nSkip; / Original value of pNew->u.btree.nSkip / u32 saved_wsFlags; / Original value of pNew->wsFlags / LogEst saved_nOut; / Original value of pNew->nOut / int iCol; / Index of the column in the table / int rc = SQLITE_OK; / Return code / ~~LogEst nRowEst; / Estimated index selectivity /~~ LogEst rLogSize; / Logarithm of table size / WhereTerm pTop = 0, pBtm = 0; / Top and bottom range constraints / pNew = pBuilder->pNew; if( db->mallocFailed ) return SQLITE_NOMEM; assert( (pNew->wsFlags & WHERE_VIRTUALTABLE)==0 ); assert( (pNew->wsFlags & WHERE_TOP_LIMIT)==0 ); if( pNew->wsFlags & WHERE_BTM_LIMIT ){ opMask = WO_LT\|WO_LE; }else if( pProbe->tnum<=0 \|\| (pSrc->jointype & JT_LEFT)!=0 ){ opMask = WO_EQ\|WO_IN\|WO_GT\|WO_GE\|WO_LT\|WO_LE; }else{ opMask = WO_EQ\|WO_IN\|WO_ISNULL\|WO_GT\|WO_GE\|WO_LT\|WO_LE; } if( pProbe->bUnordered ) 
opMask &= ~(WO_GT\|WO_GE\|WO_LT\|WO_LE); assert( pNew->u.btree.nEq<=pProbe->nKeyCol ); if( pNew->u.btree.nEq < pProbe->nKeyCol ){ iCol = pProbe->aiColumn[pNew->u.btree.nEq]; ~~nRowEst = sqlite3LogEst(pProbe->aiRowEst[pNew->u.btree.nEq+1]);~~ ~~if( nRowEst==0 && pProbe->onError==OE_None ) nRowEst = 1;~~ }else{ iCol = -1; ~~nRowEst = 0;~~ } pTerm = whereScanInit(&scan, pBuilder->pWC, pSrc->iCursor, iCol, opMask, pProbe); saved_nEq = pNew->u.btree.nEq; saved_nSkip = pNew->u.btree.nSkip; saved_nLTerm = pNew->nLTerm; saved_wsFlags = pNew->wsFlags; saved_prereq = pNew->prereq; saved_nOut = pNew->nOut; pNew->rSetup = 0; ~~rLogSize = estLog(~~sqlite3LogEst(~~pProbe->aiRowEst[0]));~~ / Consider using a skip-scan if there are no WHERE clause constraints available for the left-most terms of the index, and if the average number of repeats in the left-most terms is at least 18. ~~The magic~~ number 18 was found by experimentation to be the payoff point where skip-scan become faster than a full-scan. 
/ if( pTerm==0 && saved_nEq==saved_nSkip && saved_nEq+1<pProbe->nKeyCol ~~&& pProbe->aiRowEst[saved_nEq+1]>=18 / TUNING: Minimum for skip-scan /~~ && (rc = whereLoopResize(db, pNew, pNew->nLTerm+1))==SQLITE_OK ){ LogEst nIter; pNew->u.btree.nEq++; pNew->u.btree.nSkip++; pNew->aLTerm[pNew->nLTerm++] = 0; pNew->wsFlags \|= WHERE_SKIPSCAN; nIter = ~~sqlite3LogEst(~~pProbe->aiRowEst[~~0]/~~pProbe->aiRowEst[saved_nEq+1]); ~~pNew->rRun = rLogSize + nIter;~~ pNew->nOut += nIter; whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nIter); pNew->nOut = saved_nOut; } for(; rc==SQLITE_OK && pTerm!=0; pTerm = whereScanNext(&scan)){ int nIn = 0; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 int nRecValid = pBuilder->nRecValid; #endif ~~if( (~~pTerm->eOperator~~==WO_ISNULL \|\| (pTerm->wtFlags&TERM_VNULL)!=0)~~ && (iCol<0 \|\| pSrc->pTab->aCol[iCol].notNull) ){ continue; / ignore IS [NOT] NULL constraints on NOT NULL columns / } if( pTerm->prereqRight & pNew->maskSelf ) continue; ~~assert( pNew->nOut==saved_nOut );~~ pNew->wsFlags = saved_wsFlags; pNew->u.btree.nEq = saved_nEq; pNew->nLTerm = saved_nLTerm; if( whereLoopResize(db, pNew, pNew->nLTerm+1) ) break; / OOM / pNew->aLTerm[pNew->nLTerm++] = pTerm; pNew->prereq = (saved_prereq \| pTerm->prereqRight) & ~pNew->maskSelf; ~~pNew->rRun = rLogSize; / Baseline cost is log2(N). Adjustments below /~~ ~~if( ~~pTerm->eOperator~~ & WO_IN ){~~ Expr pExpr = pTerm->pExpr; pNew->wsFlags \|= WHERE_COLUMN_IN; if( ExprHasProperty(pExpr, EP_xIsSelect) ){ /* "x IN (SELECT ...)": TUNING: the SELECT returns 25 rows / nIn = 46; assert( 46==sqlite3LogEst(25) ); }else if( ALWAYS(pExpr->x.pList && pExpr->x.pList->nExpr) ){ / "x IN (value, value, ...)" / nIn = sqlite3LogEst(pExpr->x.pList->nExpr); } assert( nIn>0 ); / RHS always has 2 or more terms... The parser ** changes "x IN (?)" into "x=?". 
/ ~~pNew->rRun += nIn;~~ ~~pNew->u.btree.nEq++;~~ ~~pNew->nOut = nRowEst + nInMul + nIn;~~ }else if( ~~pTerm->eOperator~~ & (WO_EQ) ){ ~~assert(~~ ~~(pNew->wsFlags & (WHERE_COLUMN_NULL\|WHERE_COLUMN_IN\|WHERE_SKIPSCAN))!=0~~ ~~\|\| nInMul==0~~ ); pNew->wsFlags \|= WHERE_COLUMN_EQ; ~~if( iCol<0 \|\| (nInMul==0 && pNew->u.btree.nEq==pProbe->nKeyCol-1)){ ~~assert( (pNew->wsFlags & WHERE_COLUMN_IN)==0 \|\| iCol<0 );~~~~ if( iCol>=0 && pProbe->onError==OE_None ){ pNew->wsFlags \|= WHERE_UNQ_WANTED; }else{ pNew->wsFlags \|= WHERE_ONEROW; } } ~~~~pNew->u.btree.nEq++;~~ ~~pNew->nOut = nRowEst + nInMul;~~ }else if( ~~pTerm->~~eOp~~erator & (~~WO_ISNULL) ){~~ pNew->wsFlags \|= WHERE_COLUMN_NULL; ~~pNew->u.btree.nEq++;~~ ~~/ TUNING: IS NULL selects 2 rows /~~ ~~nIn = 10; assert( 10==sqlite3LogEst(2) );~~ ~~pNew->nOut = nRowEst + nInMul + nIn;~~ }else if( ~~pTerm->eOperator~~ & (WO_GT\|WO_GE) ){ testcase( ~~pTerm->eOperator~~ & WO_GT ); testcase( ~~pTerm->eOperator~~ & WO_GE ); pNew->wsFlags \|= WHERE_COLUMN_RANGE\|WHERE_BTM_LIMIT; pBtm = pTerm; pTop = 0; }else{ ~~assert( ~~pTerm->eOperator~~ & (WO_LT\|WO_LE) ); testcase( ~~pTerm->eOperator~~ & WO_LT ); testcase( ~~pTerm->eOperator~~ & WO_LE );~~ pNew->wsFlags \|= WHERE_COLUMN_RANGE\|WHERE_TOP_LIMIT; pTop = pTerm; pBtm = (pNew->wsFlags & WHERE_BTM_LIMIT)!=0 ? 
pNew->aLTerm[pNew->nLTerm-2] : 0; } ~~if( pNew->wsFlags & WHERE_COLUMN_RANGE ){~~ ~~~~/ Adjust nOut and rRun for STAT3 range~~ values /~~ ~~assert( pNew->nOut==saved_nOut );~~ whereRangeScanEst(pParse, pBuilder, pBtm, pTop, pNew); } #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 ~~if( nInMul==0 && pProbe->nSample && pNew->u.btree.nEq<=pProbe->nSampleCol && OptimizationEnabled(db, SQLITE_Stat3)~~ ){ Expr pExpr = pTerm->pExpr; ~~tRowcnt nOut = 0;~~ if( (~~pTerm->eOperator~~ & (WO_EQ\|WO_ISNULL))!=0 ){ testcase( ~~pTerm->eOperator~~ & WO_EQ ); testcase( ~~pTerm->eOperator~~ & WO_ISNULL ); rc = whereEqualScanEst(pParse, pBuilder, pExpr->pRight, &nOut); }else ~~if( (pTerm->eOperator & WO_IN)~~ ~~&& !ExprHasProperty(pExpr, EP_xIsSelect) ){~~ rc = whereInScanEst(pParse, pBuilder, pExpr->x.pList, &nOut); } assert( ~~nOut==0 \|\| rc=~~=SQLITE_OK ); ~~if( nOut ){ pNew->nOut = sqlite3LogEst(nOut); if( pNew->nOut>saved_nOut ) pNew->nOut = saved_nOut;~~ ~~} }~~ #endif if( (pNew->wsFlags & (WHERE_IDX_ONLY\|WHERE_IPK))==0 ){ ~~~~/* Each row involves a step of the index, then a binary search of~~ ** the main table / pNew->rRun = sqlite3LogEstAdd(pNew->rRun,~~rLogSiz~~e>27 ~~? 
rLogSize-17 :~~ 10);~~ } ~~/ Step cost for each output row */~~ ~~pNew->rRun = sql~~ite3LogEstAdd(pNew->rRu~~n~~, pNew->nOut)~~;~~ whereLoopOutputAdjust(pBuilder->pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); if( (pNew->wsFlags & WHERE_TOP_LIMIT)==0 && pNew->u.btree.nEq<(pProbe->nKeyCol + (pProbe->zName!=0)) ){ whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nInMul+nIn); } pNew->nOut = saved_nOut; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4	< < < < \| \| < < \| > > > > > > > \| \| < \| \| > > > \| < < \| > > > > > > \| \| < < \| < < < < \| < < < \| < < < < \| \| \| \| \| \| \| > > \| > > \| > > > > > > \| > > > > > > > > \| \| \| \| > > \| \| < \| \| \| \| \| < \| \| \| > > \| \| \| > \| \| > > > > > > > > > > > > > > > > > > > < < \| \| > \| > > > > > > > >	4050 4051 4052 4053 4054 4055 4056 4057 4058 4059 4060 4061 4062 4063 4064 4065 4066 4067 4068 4069 4070 4071 4072 4073 4074 4075 4076 4077 4078 4079 4080 4081 4082 4083 4084 4085 4086 4087 4088 4089 4090 4091 4092 4093 4094 4095 4096 4097 4098 4099 4100 4101 4102 4103 4104 4105 4106 4107 4108 4109 4110 4111 4112 4113 4114 4115 4116 4117 4118 4119 4120 4121 4122 4123 4124 4125 4126 4127 4128 4129 4130 4131 4132 4133 4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146 4147 4148 4149 4150 4151 4152 4153 4154 4155 4156 4157 4158 4159 4160 4161 4162 4163 4164 4165 4166 4167 4168 4169 4170 4171 4172 4173 4174 4175 4176 4177 4178 4179 4180 4181 4182 4183 4184 4185 4186 4187 4188 4189 4190 4191 4192 4193 4194 4195 4196 4197 4198 4199 4200 4201 4202 4203 4204 4205 4206 4207 4208 4209 4210 4211 4212 4213 4214 4215 4216 4217 4218 4219 4220 4221 4222 4223 4224 4225 4226 4227 4228 4229 4230 4231 4232 4233 4234 4235 4236 4237 4238 4239 4240 4241 4242 4243 4244 4245 4246 4247 4248 4249 4250 4251 4252 4253 4254 4255 4256 4257 4258 4259 4260 4261 4262 4263 4264 4265 4266 4267 4268 4269 4270 4271 4272 4273 4274 4275	u16 saved_nLTerm; /* Original value of pNew->nLTerm / u16 saved_nEq; / Original value of 
pNew->u.btree.nEq / u16 saved_nSkip; / Original value of pNew->u.btree.nSkip / u32 saved_wsFlags; / Original value of pNew->wsFlags / LogEst saved_nOut; / Original value of pNew->nOut / int iCol; / Index of the column in the table / int rc = SQLITE_OK; / Return code / LogEst rLogSize; / Logarithm of table size / WhereTerm pTop = 0, pBtm = 0; / Top and bottom range constraints / pNew = pBuilder->pNew; if( db->mallocFailed ) return SQLITE_NOMEM; assert( (pNew->wsFlags & WHERE_VIRTUALTABLE)==0 ); assert( (pNew->wsFlags & WHERE_TOP_LIMIT)==0 ); if( pNew->wsFlags & WHERE_BTM_LIMIT ){ opMask = WO_LT\|WO_LE; }else if( pProbe->tnum<=0 \|\| (pSrc->jointype & JT_LEFT)!=0 ){ opMask = WO_EQ\|WO_IN\|WO_GT\|WO_GE\|WO_LT\|WO_LE; }else{ opMask = WO_EQ\|WO_IN\|WO_ISNULL\|WO_GT\|WO_GE\|WO_LT\|WO_LE; } if( pProbe->bUnordered ) opMask &= ~(WO_GT\|WO_GE\|WO_LT\|WO_LE); assert( pNew->u.btree.nEq<=pProbe->nKeyCol ); if( pNew->u.btree.nEq < pProbe->nKeyCol ){ iCol = pProbe->aiColumn[pNew->u.btree.nEq]; }else{ iCol = -1; } pTerm = whereScanInit(&scan, pBuilder->pWC, pSrc->iCursor, iCol, opMask, pProbe); saved_nEq = pNew->u.btree.nEq; saved_nSkip = pNew->u.btree.nSkip; saved_nLTerm = pNew->nLTerm; saved_wsFlags = pNew->wsFlags; saved_prereq = pNew->prereq; saved_nOut = pNew->nOut; pNew->rSetup = 0; rLogSize = estLog(pProbe->aiRowLogEst[0]); / Consider using a skip-scan if there are no WHERE clause constraints available for the left-most terms of the index, and if the average number of repeats in the left-most terms is at least 18. The magic number 18 is selected on the basis that scanning 17 rows is almost always quicker than an index seek (even though if the index contains fewer than 2^17 rows we assume otherwise in other parts of the code). And, even if it is not, it should not be too much slower. On the other hand, the extra seeks could end up being significantly ** more expensive. 
/ assert( 42==sqlite3LogEst(18) ); if( pTerm==0 && saved_nEq==saved_nSkip && saved_nEq+1<pProbe->nKeyCol && pProbe->aiRowLogEst[saved_nEq+1]>=42 / TUNING: Minimum for skip-scan / && (rc = whereLoopResize(db, pNew, pNew->nLTerm+1))==SQLITE_OK ){ LogEst nIter; pNew->u.btree.nEq++; pNew->u.btree.nSkip++; pNew->aLTerm[pNew->nLTerm++] = 0; pNew->wsFlags \|= WHERE_SKIPSCAN; nIter = pProbe->aiRowLogEst[saved_nEq] - pProbe->aiRowLogEst[saved_nEq+1]; pNew->nOut -= nIter; whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nIter + nInMul); pNew->nOut = saved_nOut; } for(; rc==SQLITE_OK && pTerm!=0; pTerm = whereScanNext(&scan)){ u16 eOp = pTerm->eOperator; / Shorthand for pTerm->eOperator / LogEst rCostIdx; LogEst nOutUnadjusted; / nOut before IN() and WHERE adjustments / int nIn = 0; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 int nRecValid = pBuilder->nRecValid; #endif if( (eOp==WO_ISNULL \|\| (pTerm->wtFlags&TERM_VNULL)!=0) && (iCol<0 \|\| pSrc->pTab->aCol[iCol].notNull) ){ continue; / ignore IS [NOT] NULL constraints on NOT NULL columns / } if( pTerm->prereqRight & pNew->maskSelf ) continue; pNew->wsFlags = saved_wsFlags; pNew->u.btree.nEq = saved_nEq; pNew->nLTerm = saved_nLTerm; if( whereLoopResize(db, pNew, pNew->nLTerm+1) ) break; / OOM / pNew->aLTerm[pNew->nLTerm++] = pTerm; pNew->prereq = (saved_prereq \| pTerm->prereqRight) & ~pNew->maskSelf; assert( nInMul==0 \|\| (pNew->wsFlags & WHERE_COLUMN_NULL)!=0 \|\| (pNew->wsFlags & WHERE_COLUMN_IN)!=0 \|\| (pNew->wsFlags & WHERE_SKIPSCAN)!=0 ); if( eOp & WO_IN ){ Expr pExpr = pTerm->pExpr; pNew->wsFlags \|= WHERE_COLUMN_IN; if( ExprHasProperty(pExpr, EP_xIsSelect) ){ /* "x IN (SELECT ...)": TUNING: the SELECT returns 25 rows / nIn = 46; assert( 46==sqlite3LogEst(25) ); }else if( ALWAYS(pExpr->x.pList && pExpr->x.pList->nExpr) ){ / "x IN (value, value, ...)" / nIn = sqlite3LogEst(pExpr->x.pList->nExpr); } assert( nIn>0 ); / RHS always has 2 or more terms... The parser ** changes "x IN (?)" into "x=?". 
/ }else if( eOp & (WO_EQ) ){ pNew->wsFlags \|= WHERE_COLUMN_EQ; if( iCol<0 \|\| (nInMul==0 && pNew->u.btree.nEq==pProbe->nKeyCol-1) ){ if( iCol>=0 && pProbe->onError==OE_None ){ pNew->wsFlags \|= WHERE_UNQ_WANTED; }else{ pNew->wsFlags \|= WHERE_ONEROW; } } }else if( eOp & WO_ISNULL ){ pNew->wsFlags \|= WHERE_COLUMN_NULL; }else if( eOp & (WO_GT\|WO_GE) ){ testcase( eOp & WO_GT ); testcase( eOp & WO_GE ); pNew->wsFlags \|= WHERE_COLUMN_RANGE\|WHERE_BTM_LIMIT; pBtm = pTerm; pTop = 0; }else{ assert( eOp & (WO_LT\|WO_LE) ); testcase( eOp & WO_LT ); testcase( eOp & WO_LE ); pNew->wsFlags \|= WHERE_COLUMN_RANGE\|WHERE_TOP_LIMIT; pTop = pTerm; pBtm = (pNew->wsFlags & WHERE_BTM_LIMIT)!=0 ? pNew->aLTerm[pNew->nLTerm-2] : 0; } / At this point pNew->nOut is set to the number of rows expected to be visited by the index scan before considering term pTerm, or the values of nIn and nInMul. In other words, assuming that all "x IN(...)" terms are replaced with "x = ?". This block updates the value of pNew->nOut to account for pTerm (but not nIn/nInMul). / assert( pNew->nOut==saved_nOut ); if( pNew->wsFlags & WHERE_COLUMN_RANGE ){ / Adjust nOut using stat3/stat4 data. Or, if there is no stat3/stat4 ** data, using some other estimate. 
/ whereRangeScanEst(pParse, pBuilder, pBtm, pTop, pNew); }else{ int nEq = ++pNew->u.btree.nEq; assert( eOp & (WO_ISNULL\|WO_EQ\|WO_IN) ); assert( pNew->nOut==saved_nOut ); if( pTerm->truthProb<=0 && iCol>=0 ){ assert( (eOp & WO_IN) \|\| nIn==0 ); pNew->nOut += pTerm->truthProb; pNew->nOut -= nIn; pNew->wsFlags \|= WHERE_LIKELIHOOD; }else{ #ifdef SQLITE_ENABLE_STAT3_OR_STAT4 tRowcnt nOut = 0; if( nInMul==0 && pProbe->nSample && pNew->u.btree.nEq<=pProbe->nSampleCol && OptimizationEnabled(db, SQLITE_Stat3) && ((eOp & WO_IN)==0 \|\| !ExprHasProperty(pTerm->pExpr, EP_xIsSelect)) && (pNew->wsFlags & WHERE_LIKELIHOOD)==0 ){ Expr pExpr = pTerm->pExpr; if( (eOp & (WO_EQ\|WO_ISNULL))!=0 ){ testcase( eOp & WO_EQ ); testcase( eOp & WO_ISNULL ); rc = whereEqualScanEst(pParse, pBuilder, pExpr->pRight, &nOut); }else{ rc = whereInScanEst(pParse, pBuilder, pExpr->x.pList, &nOut); } assert( rc!=SQLITE_OK \|\| nOut>0 ); if( rc==SQLITE_NOTFOUND ) rc = SQLITE_OK; if( rc!=SQLITE_OK ) break; /* Jump out of the pTerm loop / if( nOut ){ pNew->nOut = sqlite3LogEst(nOut); if( pNew->nOut>saved_nOut ) pNew->nOut = saved_nOut; pNew->nOut -= nIn; } } if( nOut==0 ) #endif { pNew->nOut += (pProbe->aiRowLogEst[nEq] - pProbe->aiRowLogEst[nEq-1]); if( eOp & WO_ISNULL ){ / TUNING: If there is no likelihood() value, assume that a "col IS NULL" expression matches twice as many rows as (col=?). / pNew->nOut += 10; } } } } / Set rCostIdx to the cost of visiting selected rows in index. Add it to pNew->rRun, which is currently set to the cost of the index seek only. Then, if this is a non-covering index, add the cost of ** visiting the rows in the main table. 
/ rCostIdx = pNew->nOut + 1 + (15pProbe->szIdxRow)/pSrc->pTab->szTabRow; pNew->rRun = sqlite3LogEstAdd(rLogSize, rCostIdx); if( (pNew->wsFlags & (WHERE_IDX_ONLY\|WHERE_IPK))==0 ){ pNew->rRun = sqlite3LogEstAdd(pNew->rRun, pNew->nOut + 16); } nOutUnadjusted = pNew->nOut; pNew->rRun += nInMul + nIn; pNew->nOut += nInMul + nIn; whereLoopOutputAdjust(pBuilder->pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); if( pNew->wsFlags & WHERE_COLUMN_RANGE ){ pNew->nOut = saved_nOut; }else{ pNew->nOut = nOutUnadjusted; } if( (pNew->wsFlags & WHERE_TOP_LIMIT)==0 && pNew->u.btree.nEq<(pProbe->nKeyCol + (pProbe->zName!=0)) ){ whereLoopAddBtreeIndex(pBuilder, pSrc, pProbe, nInMul+nIn); } pNew->nOut = saved_nOut; #ifdef SQLITE_ENABLE_STAT3_OR_STAT4
︙			︙
4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 ~~4284~~ 4285 4286 4287 4288 4289 4290 4291	return 0; } /* Add all WhereLoop objects for a single table of the join where the table is idenfied by pBuilder->pNew->iTab. That table is guaranteed to be ** a b-tree table, not a virtual table. / static int whereLoopAddBtree( WhereLoopBuilder pBuilder, /* WHERE clause information / Bitmask mExtra / Extra prerequesites for using this table / ){ WhereInfo pWInfo; /* WHERE analysis context / Index pProbe; /* An index we are evaluating / Index sPk; / A fake index object for the primary key / ~~~~tRowcn~~t aiRowEstPk[2]; / The aiRowEst[] value for the sPk index /~~ i16 aiColumnPk = -1; / The aColumn[] value for the sPk index / SrcList pTabList; /* The FROM clause / struct SrcList_item pSrc; /* The FROM clause btree term to add / WhereLoop pNew; /* Template WhereLoop object / int rc = SQLITE_OK; / Return code / int iSortIdx = 1; / Index number / int b; / A boolean value */	> > > > > > > > > > > > > > > > > > > > > > > \|	4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369 4370 4371 4372 4373 4374 4375 4376 4377 4378 4379 4380 4381 4382 4383 4384 4385 4386 4387 4388 4389 4390	return 0; } /* Add all WhereLoop objects for a single table of the join where the table is idenfied by pBuilder->pNew->iTab. That table is guaranteed to be a b-tree table, not a virtual table. The costs (WhereLoop.rRun) of the b-tree loops added by this function are calculated as follows: For a full scan, assuming the table (or index) contains nRow rows: cost = nRow * 3.0 // full-table scan ** cost = nRow * K // scan of covering index ** cost = nRow * (K+3.0) // scan of non-covering index where K is a value between 1.1 and 3.0 set based on the relative estimated average size of the index and table records. 
For an index scan, where nVisit is the number of index rows visited by the scan, and nSeek is the number of seek operations required on the index b-tree: ** cost = nSeek * (log(nRow) + K * nVisit) // covering index ** cost = nSeek * (log(nRow) + (K+3.0) * nVisit) // non-covering index Normally, nSeek is 1. nSeek values greater than 1 come about if the WHERE clause includes "x IN (....)" terms used in place of "x=?". Or when implicit "x IN (SELECT x FROM tbl)" terms are added for skip-scans. / static int whereLoopAddBtree( WhereLoopBuilder pBuilder, /* WHERE clause information / Bitmask mExtra / Extra prerequesites for using this table / ){ WhereInfo pWInfo; /* WHERE analysis context / Index pProbe; /* An index we are evaluating / Index sPk; / A fake index object for the primary key / LogEst aiRowEstPk[2]; / The aiRowLogEst[] value for the sPk index / i16 aiColumnPk = -1; / The aColumn[] value for the sPk index / SrcList pTabList; /* The FROM clause / struct SrcList_item pSrc; /* The FROM clause btree term to add / WhereLoop pNew; /* Template WhereLoop object / int rc = SQLITE_OK; / Return code / int iSortIdx = 1; / Index number / int b; / A boolean value */
︙			︙
4312 4313 4314 4315 4316 4317 4318 ~~4319~~ 4320 4321 ~~4322 4323~~ 4324 4325 4326 4327 4328 4329 4330 4331 ~~4332~~ 4333 4334 4335 4336 4337 4338 4339	variable sPk to represent the rowid primary key index. Make this fake index the first in a chain of Index objects with all of the real ** indices to follow / Index pFirst; /* First of real indices on the table / memset(&sPk, 0, sizeof(Index)); sPk.nKeyCol = 1; sPk.aiColumn = &aiColumnPk; ~~sPk.aiRowEst = aiRowEstPk;~~ sPk.onError = OE_Replace; sPk.pTable = pTab; ~~aiRowEstPk[0] = pTab->nRowEst; aiRowEstPk[1] = 1;~~ pFirst = pSrc->pTab->pIndex; if( pSrc->notIndexed==0 ){ / The real indices of the table are only considered if the ** NOT INDEXED qualifier is omitted from the FROM clause / sPk.pNext = pFirst; } pProbe = &sPk; } ~~rSize = ~~sqlite3LogEst(~~pTab->nRow~~Est)~~;~~ rLogSize = estLog(rSize); #ifndef SQLITE_OMIT_AUTOMATIC_INDEX / Automatic indexes */ if( !pBuilder->pOrSet && (pWInfo->pParse->db->flags & SQLITE_AutoIndex)!=0 && pSrc->pIndex==0	\| > \| \| \|	4411 4412 4413 4414 4415 4416 4417 4418 4419 4420 4421 4422 4423 4424 4425 4426 4427 4428 4429 4430 4431 4432 4433 4434 4435 4436 4437 4438 4439	variable sPk to represent the rowid primary key index. 
Make this fake index the first in a chain of Index objects with all of the real ** indices to follow / Index pFirst; /* First of real indices on the table / memset(&sPk, 0, sizeof(Index)); sPk.nKeyCol = 1; sPk.aiColumn = &aiColumnPk; sPk.aiRowLogEst = aiRowEstPk; sPk.onError = OE_Replace; sPk.pTable = pTab; sPk.szIdxRow = pTab->szTabRow; aiRowEstPk[0] = pTab->nRowLogEst; aiRowEstPk[1] = 0; pFirst = pSrc->pTab->pIndex; if( pSrc->notIndexed==0 ){ / The real indices of the table are only considered if the ** NOT INDEXED qualifier is omitted from the FROM clause / sPk.pNext = pFirst; } pProbe = &sPk; } rSize = pTab->nRowLogEst; rLogSize = estLog(rSize); #ifndef SQLITE_OMIT_AUTOMATIC_INDEX / Automatic indexes */ if( !pBuilder->pOrSet && (pWInfo->pParse->db->flags & SQLITE_AutoIndex)!=0 && pSrc->pIndex==0
︙			︙
4375 4376 4377 4378 4379 4380 4381 4382 4383 4384 4385 4386 4387 4388 4389 4390 4391 4392 4393 4394 4395 4396 4397 4398 ~~4399 4400 4401 4402~~ 4403 4404 4405 4406 4407 4408 4409	/* Loop over all indices / for(; rc==SQLITE_OK && pProbe; pProbe=pProbe->pNext, iSortIdx++){ if( pProbe->pPartIdxWhere!=0 && !whereUsablePartialIndex(pNew->iTab, pWC, pProbe->pPartIdxWhere) ){ continue; / Partial index inappropriate for this query / } pNew->u.btree.nEq = 0; pNew->u.btree.nSkip = 0; pNew->nLTerm = 0; pNew->iSortIdx = 0; pNew->rSetup = 0; pNew->prereq = mExtra; pNew->nOut = rSize; pNew->u.btree.pIndex = pProbe; b = indexMightHelpWithOrderBy(pBuilder, pProbe, pSrc->iCursor); / The ONEPASS_DESIRED flags never occurs together with ORDER BY / assert( (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 \|\| b==0 ); if( pProbe->tnum<=0 ){ / Integer primary key index / pNew->wsFlags = WHERE_IPK; / Full table scan / pNew->iSortIdx = b ? iSortIdx : 0; / TUNING: Cost of full table scan is 3(N ~~+ log2(N)~~). * + The extra 3 factor is to encourage the use of indexed lookups ** over full scans. 
FIXME */ pNew->rRun = ~~sqlite3LogEstAdd(rSize,rLogSize)~~ + 16; whereLoopOutputAdjust(pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); pNew->nOut = rSize; if( rc ) break; }else{ Bitmask m; if( pProbe->isCovering ){	> \| < < \|	4475 4476 4477 4478 4479 4480 4481 4482 4483 4484 4485 4486 4487 4488 4489 4490 4491 4492 4493 4494 4495 4496 4497 4498 4499 4500 4501 4502 4503 4504 4505 4506 4507 4508	/* Loop over all indices / for(; rc==SQLITE_OK && pProbe; pProbe=pProbe->pNext, iSortIdx++){ if( pProbe->pPartIdxWhere!=0 && !whereUsablePartialIndex(pNew->iTab, pWC, pProbe->pPartIdxWhere) ){ continue; / Partial index inappropriate for this query / } rSize = pProbe->aiRowLogEst[0]; pNew->u.btree.nEq = 0; pNew->u.btree.nSkip = 0; pNew->nLTerm = 0; pNew->iSortIdx = 0; pNew->rSetup = 0; pNew->prereq = mExtra; pNew->nOut = rSize; pNew->u.btree.pIndex = pProbe; b = indexMightHelpWithOrderBy(pBuilder, pProbe, pSrc->iCursor); / The ONEPASS_DESIRED flags never occurs together with ORDER BY / assert( (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 \|\| b==0 ); if( pProbe->tnum<=0 ){ / Integer primary key index / pNew->wsFlags = WHERE_IPK; / Full table scan / pNew->iSortIdx = b ? iSortIdx : 0; / TUNING: Cost of full table scan is (N3.0). / pNew->rRun = rSize + 16; whereLoopOutputAdjust(pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); pNew->nOut = rSize; if( rc ) break; }else{ Bitmask m; if( pProbe->isCovering ){
︙			︙
4422 4423 4424 4425 4426 4427 4428 ~~4429 4430 4431 4432 4433 4434 4435 4436 4437 4438 4439 4440 4441~~ ~~4442 4443 4444 4445 4446 4447 4448 4449 4450 4451 4452 4453 4454 4455 4456~~ 4457 4458 4459 4460 4461 4462 4463 4464	&& (pProbe->szIdxRow<pTab->szTabRow) && (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 && sqlite3GlobalConfig.bUseCis && OptimizationEnabled(pWInfo->pParse->db, SQLITE_CoverIdxScan) ) ){ pNew->iSortIdx = b ? iSortIdx : 0; ~~/* TUNING: The base cost of an index scan is N + log2(N).~~ The log2(N) is for the initial seek to the beginning and the N is for the scan itself. / ~~pNew->rRun = sqlite3LogEstAdd(rSize, rLogSize);~~ ~~if( m==0 ){~~ ~~/ TUNING: C~~ost of ~~a cover~~ing index ~~scan~~ is K(N ~~+ log2(N)).~~ * + The extra factor K of between 1.1 and 3.0 that depends on the relative sizes of the ~~table and the index. K~~ is smaller for smaller indices, thus favoring them. The upper bound on K (3.0) matches the penalty factor on a full table scan that tries to encourage the use of ** indexed l~~ookup~~s over ~~full~~ scans. / pNew->rRun += 1 + (15pProbe->szIdxRow)/pTab->szTabRow; ~~}else{~~ ~~/* TUNING: The cost of scanning a non-covering index is multiplied~~ by log2(N) to account for the binary search of the main table that must happen for each row of the index. TODO: Should there be a multiplier here, analogous to the 3x multiplier for a fulltable scan or covering index scan, to further discourage the use of an index scan? Or is the log2(N) term sufficient discouragement? TODO: What if some or all of the WHERE clause terms can be computed without reference to the original table. Then the penality should reduce to logK where K is the number of output rows. 
*/ pNew->rRun ~~+= r~~LogSize; } whereLoopOutputAdjust(pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); pNew->nOut = rSize; if( rc ) break; } }	\| < < < < \| < \| < < < \| < > \| < < < < < < < < < < < \| < \| >	4521 4522 4523 4524 4525 4526 4527 4528 4529 4530 4531 4532 4533 4534 4535 4536 4537 4538 4539 4540 4541 4542 4543 4544	&& (pProbe->szIdxRow<pTab->szTabRow) && (pWInfo->wctrlFlags & WHERE_ONEPASS_DESIRED)==0 && sqlite3GlobalConfig.bUseCis && OptimizationEnabled(pWInfo->pParse->db, SQLITE_CoverIdxScan) ) ){ pNew->iSortIdx = b ? iSortIdx : 0; /* The cost of visiting the index rows is NK, where K is * between 1.1 and 3.0, depending on the relative sizes of the index and table rows. If this is a non-covering index scan, also add the cost of visiting table rows (N3.0). / pNew->rRun = rSize + 1 + (15*pProbe->szIdxRow)/pTab->szTabRow; if( m!=0 ){ pNew->rRun = sqlite3LogEstAdd(pNew->rRun, rSize+16); } whereLoopOutputAdjust(pWC, pNew); rc = whereLoopInsert(pBuilder, pNew); pNew->nOut = rSize; if( rc ) break; } }
︙			︙
4728 4729 4730 4731 4732 4733 4734 ~~4735 4736~~ 4737 4738 4739 4740 4741 4742 4743	pNew->nLTerm = 1; pNew->aLTerm[0] = pTerm; pNew->wsFlags = WHERE_MULTI_OR; pNew->rSetup = 0; pNew->iSortIdx = 0; memset(&pNew->u, 0, sizeof(pNew->u)); for(i=0; rc==SQLITE_OK && i<sSum.n; i++){ ~~~~/* TUNING: Multiple by 3.5 for the secondary table lookup */~~ pNew->rRun = sSum.a[i].rRun ~~+ 18~~;~~ pNew->nOut = sSum.a[i].nOut; pNew->prereq = sSum.a[i].prereq; rc = whereLoopInsert(pBuilder, pNew); } } } return rc;	< \|	4808 4809 4810 4811 4812 4813 4814 4815 4816 4817 4818 4819 4820 4821 4822	pNew->nLTerm = 1; pNew->aLTerm[0] = pTerm; pNew->wsFlags = WHERE_MULTI_OR; pNew->rSetup = 0; pNew->iSortIdx = 0; memset(&pNew->u, 0, sizeof(pNew->u)); for(i=0; rc==SQLITE_OK && i<sSum.n; i++){ pNew->rRun = sSum.a[i].rRun; pNew->nOut = sSum.a[i].nOut; pNew->prereq = sSum.a[i].prereq; rc = whereLoopInsert(pBuilder, pNew); } } } return rc;
︙			︙
5175 5176 5177 5178 5179 5180 5181 ~~5182~~ ~~5183 5184 5185 5186 5187 5188 5189 5190~~ 5191 ~~5192~~ 5193 ~~5194~~ 5195 ~~5196 5197~~ 5198 5199 5200 5201 5202 5203 5204	nOut = pFrom->nRow + pWLoop->nOut; maskNew = pFrom->maskLoop \| pWLoop->maskSelf; if( isOrdered<0 ){ isOrdered = wherePathSatisfiesOrderBy(pWInfo, pWInfo->pOrderBy, pFrom, pWInfo->wctrlFlags, iLoop, pWLoop, &revMask); if( isOrdered>=0 && isOrdered<nOrderBy ){ ~~/* TUNING: Estimated cost of sort~~ing~~ is ~~Nlog(N).~~~~ * If the order-by clause has X terms but only the last Y ~~terms~~ are out of order, then block-sorting will reduce the ~~sorting~~ cost to ~~Nlog(N)log(Y/X). The log(Y/X) term is computed~~ ~~by rScale.~~ TODO: Should the sorting cost get a small multiplier to help discourage the use of sorting and encourage the use of index ~~scans in~~st~~ead?~~ / LogEst rScale, rSortCost; ~~assert( nOrderBy>0 );~~ rScale = sqlite3LogEst((nOrderBy-isOrdered)100/nOrderBy) - 66; ~~rSortCost = nRowEst + estLog(nRowEst) + rScale;~~ /* TUNING: The cost of implementing DISTINCT using a B-TREE is ** a~~lso Nlog(N)~~ but ~~it has~~ a larger constant of proportionality. 
* Multiply by ~~3.0.~~ */ if( pWInfo->wctrlFlags & WHERE_WANT_DISTINCT ){ rSortCost += 16; } WHERETRACE(0x002, ("---- sort cost=%-3d (%d/%d) increases cost %3d to %-3d\n", rSortCost, (nOrderBy-isOrdered), nOrderBy, rCost, sqlite3LogEstAdd(rCost,rSortCost)));	\| > > > > \| \| \| \| < < \| \| > > \| \| > \| \|	5254 5255 5256 5257 5258 5259 5260 5261 5262 5263 5264 5265 5266 5267 5268 5269 5270 5271 5272 5273 5274 5275 5276 5277 5278 5279 5280 5281 5282 5283 5284 5285 5286 5287 5288	nOut = pFrom->nRow + pWLoop->nOut; maskNew = pFrom->maskLoop \| pWLoop->maskSelf; if( isOrdered<0 ){ isOrdered = wherePathSatisfiesOrderBy(pWInfo, pWInfo->pOrderBy, pFrom, pWInfo->wctrlFlags, iLoop, pWLoop, &revMask); if( isOrdered>=0 && isOrdered<nOrderBy ){ /* TUNING: Estimated cost of a full external sort, where N is the number of rows to sort is: ** cost = (3.0 * N * log(N)). Or, if the order-by clause has X terms but only the last Y terms are out of order, then block-sorting will reduce the sorting cost to: cost = (3.0 * N * log(N)) * (Y/X) The (Y/X) term is implemented using stack variable rScale ** below. / LogEst rScale, rSortCost; assert( nOrderBy>0 && 66==sqlite3LogEst(100) ); rScale = sqlite3LogEst((nOrderBy-isOrdered)100/nOrderBy) - 66; rSortCost = nRowEst + estLog(nRowEst) + rScale + 16; /* TUNING: The cost of implementing DISTINCT using a B-TREE is similar but with a larger constant of proportionality. Multiply by an additional factor of 3.0. */ if( pWInfo->wctrlFlags & WHERE_WANT_DISTINCT ){ rSortCost += 16; } WHERETRACE(0x002, ("---- sort cost=%-3d (%d/%d) increases cost %3d to %-3d\n", rSortCost, (nOrderBy-isOrdered), nOrderBy, rCost, sqlite3LogEstAdd(rCost,rSortCost)));
︙			︙

︙			︙
10 11 12 13 14 15 16 17 18 19 20 21 22 23	#*********************************************************************** # # Test cases for query planning decisions and the unlikely() and # likelihood() functions. set testdir [file dirname $argv0] source $testdir/tester.tcl do_execsql_test whereG-1.0 { CREATE TABLE composer( cid INTEGER PRIMARY KEY, cname TEXT ); CREATE TABLE album(	>	10 11 12 13 14 15 16 17 18 19 20 21 22 23 24	#*********************************************************************** # # Test cases for query planning decisions and the unlikely() and # likelihood() functions. set testdir [file dirname $argv0] source $testdir/tester.tcl set testprefix whereG do_execsql_test whereG-1.0 { CREATE TABLE composer( cid INTEGER PRIMARY KEY, cname TEXT ); CREATE TABLE album(
︙			︙
175 176 177 178 179 180 181 ~~182~~ 183	INSERT INTO t4 VALUES('right'),('wrong'); SELECT DISTINCT x FROM (SELECT x FROM t4 GROUP BY x) WHERE x='right' ORDER BY x; } {right} finish_test	> > > \| > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > > >	176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225	INSERT INTO t4 VALUES('right'),('wrong'); SELECT DISTINCT x FROM (SELECT x FROM t4 GROUP BY x) WHERE x='right' ORDER BY x; } {right} #------------------------------------------------------------------------- # Test that likelihood() specifications on indexed terms are taken into # account by various forms of loops. # # 5.1.*: open ended range scans # 5.2.*: skip-scans # reset_db do_execsql_test 5.1 { CREATE TABLE t1(a, b, c); CREATE INDEX i1 ON t1(a, b); } do_eqp_test 5.1.2 { SELECT * FROM t1 WHERE a>? } {0 0 0 {SEARCH TABLE t1 USING INDEX i1 (a>?)}} do_eqp_test 5.1.3 { SELECT * FROM t1 WHERE likelihood(a>?, 0.9) } {0 0 0 {SCAN TABLE t1}} do_test 5.2 { for {set i 0} {$i < 100} {incr i} { execsql { INSERT INTO t1 VALUES('abc', $i, $i); } } execsql { INSERT INTO t1 SELECT 'def', b, c FROM t1; } execsql { ANALYZE } } {} do_eqp_test 5.2.2 { SELECT * FROM t1 WHERE likelihood(b>?, 0.01) } {0 0 0 {SEARCH TABLE t1 USING INDEX i1 (ANY(a) AND b>?)}} do_eqp_test 5.2.3 { SELECT * FROM t1 WHERE likelihood(b>?, 0.9) } {0 0 0 {SCAN TABLE t1}} do_eqp_test 5.3.1 { SELECT * FROM t1 WHERE a=? } {0 0 0 {SEARCH TABLE t1 USING INDEX i1 (a=?)}} do_eqp_test 5.3.2 { SELECT * FROM t1 WHERE likelihood(a=?, 0.9) } {0 0 0 {SCAN TABLE t1}} finish_test

︙			︙
79 80 81 82 83 84 85 86 87 88 89 90 91 92 93	return (n+8)>>(3-x); } static LogEst logEstFromDouble(double x){ sqlite3_uint64 a; LogEst e; assert( sizeof(x)==8 && sizeof(a)==8 ); if( x<=0.0 ) return -32768; ~~if( x<~~1.0~~ ) return -logEstFromDouble(1/x);~~ if( x<1024.0 ) return logEstFromInteger((sqlite3_uint64)(1024.0*x)) - 100; if( x<=2000000000.0 ) return logEstFromInteger((sqlite3_uint64)x); memcpy(&a, &x, 8); e = (a>>52) - 1022; return e*10; }	\| >	79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94	return (n+8)>>(3-x); } static LogEst logEstFromDouble(double x){ sqlite3_uint64 a; LogEst e; assert( sizeof(x)==8 && sizeof(a)==8 ); if( x<=0.0 ) return -32768; if( x<0.01 ) return -logEstFromDouble(1.0/x); if( x<1.0 ) return logEstFromDouble(100.0*x) - 66; if( x<1024.0 ) return logEstFromInteger((sqlite3_uint64)(1024.0*x)) - 100; if( x<=2000000000.0 ) return logEstFromInteger((sqlite3_uint64)x); memcpy(&a, &x, 8); e = (a>>52) - 1022; return e*10; }
︙			︙
152 153 154 155 156 157 158 ~~159~~ 160 161 162 163 164 165 166 167	}else if( isFloat(z) && z[0]!='-' ){ a[n++] = logEstFromDouble(atof(z)); }else{ showHelp(argv[0]); } } for(i=n-1; i>=0; i--){ ~~if( a[i]<0 ){~~ printf("%5d (%f)\n", a[i], 1.0/(double)logEstToInt(-a[i])); }else{ sqlite3_uint64 x = logEstToInt(a[i]+100)*100/1024; printf("%5d (%lld.%02lld)\n", a[i], x/100, x%100); } } return 0; }	\| > >	153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170	}else if( isFloat(z) && z[0]!='-' ){ a[n++] = logEstFromDouble(atof(z)); }else{ showHelp(argv[0]); } } for(i=n-1; i>=0; i--){ if( a[i]<-40 ){ printf("%5d (%f)\n", a[i], 1.0/(double)logEstToInt(-a[i])); }else if( a[i]<10 ){ printf("%5d (%f)\n", a[i], logEstToInt(a[i]+100)/1024.0); }else{ sqlite3_uint64 x = logEstToInt(a[i]+100)*100/1024; printf("%5d (%lld.%02lld)\n", a[i], x/100, x%100); } } return 0; }