1 /* 2 ** 2008 August 05 3 ** 4 ** The author disclaims copyright to this source code. In place of 5 ** a legal notice, here is a blessing: 6 ** 7 ** May you do good and not evil. 8 ** May you find forgiveness for yourself and forgive others. 9 ** May you share freely, never taking more than you give. 10 ** 11 ************************************************************************* 12 ** This file implements that page cache. 13 ** 14 ** @(#) $Id: pcache.c,v 1.45 2009/07/16 18:21:18 drh Exp $ 15 */ 16 #include "sqliteInt.h" 17 18 /* 19 ** A complete page cache is an instance of this structure. 20 */ 21 struct PCache { 22 PgHdr *pDirty, *pDirtyTail; /* List of dirty pages in LRU order */ 23 PgHdr *pSynced; /* Last synced page in dirty page list */ 24 int nRef; /* Number of referenced pages */ 25 int nMax; /* Configured cache size */ 26 int szPage; /* Size of every page in this cache */ 27 int szExtra; /* Size of extra space for each page */ 28 int bPurgeable; /* True if pages are on backing store */ 29 int (*xStress)(void*,PgHdr*); /* Call to try make a page clean */ 30 void *pStress; /* Argument to xStress */ 31 sqlite3_pcache *pCache; /* Pluggable cache module */ 32 PgHdr *pPage1; /* Reference to page 1 */ 33 }; 34 35 /* 36 ** Some of the assert() macros in this code are too expensive to run 37 ** even during normal debugging. Use them only rarely on long-running 38 ** tests. Enable the expensive asserts using the 39 ** -DSQLITE_ENABLE_EXPENSIVE_ASSERT=1 compile-time option. 40 */ 41 #ifdef SQLITE_ENABLE_EXPENSIVE_ASSERT 42 # define expensive_assert(X) assert(X) 43 #else 44 # define expensive_assert(X) 45 #endif 46 47 /********************************** Linked List Management ********************/ 48 49 #if !defined(NDEBUG) && defined(SQLITE_ENABLE_EXPENSIVE_ASSERT) 50 /* 51 ** Check that the pCache->pSynced variable is set correctly. If it 52 ** is not, either fail an assert or return zero. Otherwise, return 53 ** non-zero. This is only used in debugging builds, as follows: 54 ** 55 ** expensive_assert( pcacheCheckSynced(pCache) ); 56 */ 57 static int pcacheCheckSynced(PCache *pCache){ 58 PgHdr *p; 59 for(p=pCache->pDirtyTail; p!=pCache->pSynced; p=p->pDirtyPrev){ 60 assert( p->nRef || (p->flags&PGHDR_NEED_SYNC) ); 61 } 62 return (p==0 || p->nRef || (p->flags&PGHDR_NEED_SYNC)==0); 63 } 64 #endif /* !NDEBUG && SQLITE_ENABLE_EXPENSIVE_ASSERT */ 65 66 /* 67 ** Remove page pPage from the list of dirty pages. 68 */ 69 static void pcacheRemoveFromDirtyList(PgHdr *pPage){ 70 PCache *p = pPage->pCache; 71 72 assert( pPage->pDirtyNext || pPage==p->pDirtyTail ); 73 assert( pPage->pDirtyPrev || pPage==p->pDirty ); 74 75 /* Update the PCache1.pSynced variable if necessary. */ 76 if( p->pSynced==pPage ){ 77 PgHdr *pSynced = pPage->pDirtyPrev; 78 while( pSynced && (pSynced->flags&PGHDR_NEED_SYNC) ){ 79 pSynced = pSynced->pDirtyPrev; 80 } 81 p->pSynced = pSynced; 82 } 83 84 if( pPage->pDirtyNext ){ 85 pPage->pDirtyNext->pDirtyPrev = pPage->pDirtyPrev; 86 }else{ 87 assert( pPage==p->pDirtyTail ); 88 p->pDirtyTail = pPage->pDirtyPrev; 89 } 90 if( pPage->pDirtyPrev ){ 91 pPage->pDirtyPrev->pDirtyNext = pPage->pDirtyNext; 92 }else{ 93 assert( pPage==p->pDirty ); 94 p->pDirty = pPage->pDirtyNext; 95 } 96 pPage->pDirtyNext = 0; 97 pPage->pDirtyPrev = 0; 98 99 expensive_assert( pcacheCheckSynced(p) ); 100 } 101 102 /* 103 ** Add page pPage to the head of the dirty list (PCache1.pDirty is set to 104 ** pPage). 105 */ 106 static void pcacheAddToDirtyList(PgHdr *pPage){ 107 PCache *p = pPage->pCache; 108 109 assert( pPage->pDirtyNext==0 && pPage->pDirtyPrev==0 && p->pDirty!=pPage ); 110 111 pPage->pDirtyNext = p->pDirty; 112 if( pPage->pDirtyNext ){ 113 assert( pPage->pDirtyNext->pDirtyPrev==0 ); 114 pPage->pDirtyNext->pDirtyPrev = pPage; 115 } 116 p->pDirty = pPage; 117 if( !p->pDirtyTail ){ 118 p->pDirtyTail = pPage; 119 } 120 if( !p->pSynced && 0==(pPage->flags&PGHDR_NEED_SYNC) ){ 121 p->pSynced = pPage; 122 } 123 expensive_assert( pcacheCheckSynced(p) ); 124 } 125 126 /* 127 ** Wrapper around the pluggable caches xUnpin method. If the cache is 128 ** being used for an in-memory database, this function is a no-op. 129 */ 130 static void pcacheUnpin(PgHdr *p){ 131 PCache *pCache = p->pCache; 132 if( pCache->bPurgeable ){ 133 if( p->pgno==1 ){ 134 pCache->pPage1 = 0; 135 } 136 sqlite3GlobalConfig.pcache.xUnpin(pCache->pCache, p, 0); 137 } 138 } 139 140 /*************************************************** General Interfaces ****** 141 ** 142 ** Initialize and shutdown the page cache subsystem. Neither of these 143 ** functions are threadsafe. 144 */ 145 int sqlite3PcacheInitialize(void){ 146 if( sqlite3GlobalConfig.pcache.xInit==0 ){ 147 sqlite3PCacheSetDefault(); 148 } 149 return sqlite3GlobalConfig.pcache.xInit(sqlite3GlobalConfig.pcache.pArg); 150 } 151 void sqlite3PcacheShutdown(void){ 152 if( sqlite3GlobalConfig.pcache.xShutdown ){ 153 sqlite3GlobalConfig.pcache.xShutdown(sqlite3GlobalConfig.pcache.pArg); 154 } 155 } 156 157 /* 158 ** Return the size in bytes of a PCache object. 159 */ 160 int sqlite3PcacheSize(void){ return sizeof(PCache); } 161 162 /* 163 ** Create a new PCache object. Storage space to hold the object 164 ** has already been allocated and is passed in as the p pointer. 165 ** The caller discovers how much space needs to be allocated by 166 ** calling sqlite3PcacheSize(). 167 */ 168 void sqlite3PcacheOpen( 169 int szPage, /* Size of every page */ 170 int szExtra, /* Extra space associated with each page */ 171 int bPurgeable, /* True if pages are on backing store */ 172 int (*xStress)(void*,PgHdr*),/* Call to try to make pages clean */ 173 void *pStress, /* Argument to xStress */ 174 PCache *p /* Preallocated space for the PCache */ 175 ){ 176 memset(p, 0, sizeof(PCache)); 177 p->szPage = szPage; 178 p->szExtra = szExtra; 179 p->bPurgeable = bPurgeable; 180 p->xStress = xStress; 181 p->pStress = pStress; 182 p->nMax = 100; 183 } 184 185 /* 186 ** Change the page size for PCache object. The caller must ensure that there 187 ** are no outstanding page references when this function is called. 188 */ 189 void sqlite3PcacheSetPageSize(PCache *pCache, int szPage){ 190 assert( pCache->nRef==0 && pCache->pDirty==0 ); 191 if( pCache->pCache ){ 192 sqlite3GlobalConfig.pcache.xDestroy(pCache->pCache); 193 pCache->pCache = 0; 194 } 195 pCache->szPage = szPage; 196 } 197 198 /* 199 ** Try to obtain a page from the cache. 200 */ 201 int sqlite3PcacheFetch( 202 PCache *pCache, /* Obtain the page from this cache */ 203 Pgno pgno, /* Page number to obtain */ 204 int createFlag, /* If true, create page if it does not exist already */ 205 PgHdr **ppPage /* Write the page here */ 206 ){ 207 PgHdr *pPage = 0; 208 int eCreate; 209 210 assert( pCache!=0 ); 211 assert( pgno>0 ); 212 213 /* If the pluggable cache (sqlite3_pcache*) has not been allocated, 214 ** allocate it now. 215 */ 216 if( !pCache->pCache && createFlag ){ 217 sqlite3_pcache *p; 218 int nByte; 219 nByte = pCache->szPage + pCache->szExtra + sizeof(PgHdr); 220 p = sqlite3GlobalConfig.pcache.xCreate(nByte, pCache->bPurgeable); 221 if( !p ){ 222 return SQLITE_NOMEM; 223 } 224 sqlite3GlobalConfig.pcache.xCachesize(p, pCache->nMax); 225 pCache->pCache = p; 226 } 227 228 eCreate = createFlag ? 1 : 0; 229 if( eCreate && (!pCache->bPurgeable || !pCache->pDirty) ){ 230 eCreate = 2; 231 } 232 if( pCache->pCache ){ 233 pPage = sqlite3GlobalConfig.pcache.xFetch(pCache->pCache, pgno, eCreate); 234 } 235 236 if( !pPage && eCreate==1 ){ 237 PgHdr *pPg; 238 239 /* Find a dirty page to write-out and recycle. First try to find a 240 ** page that does not require a journal-sync (one with PGHDR_NEED_SYNC 241 ** cleared), but if that is not possible settle for any other 242 ** unreferenced dirty page. 243 */ 244 expensive_assert( pcacheCheckSynced(pCache) ); 245 for(pPg=pCache->pSynced; 246 pPg && (pPg->nRef || (pPg->flags&PGHDR_NEED_SYNC)); 247 pPg=pPg->pDirtyPrev 248 ); 249 if( !pPg ){ 250 for(pPg=pCache->pDirtyTail; pPg && pPg->nRef; pPg=pPg->pDirtyPrev); 251 } 252 if( pPg ){ 253 int rc; 254 rc = pCache->xStress(pCache->pStress, pPg); 255 if( rc!=SQLITE_OK && rc!=SQLITE_BUSY ){ 256 return rc; 257 } 258 } 259 260 pPage = sqlite3GlobalConfig.pcache.xFetch(pCache->pCache, pgno, 2); 261 } 262 263 if( pPage ){ 264 if( !pPage->pData ){ 265 memset(pPage, 0, sizeof(PgHdr) + pCache->szExtra); 266 pPage->pExtra = (void*)&pPage[1]; 267 pPage->pData = (void *)&((char *)pPage)[sizeof(PgHdr) + pCache->szExtra]; 268 pPage->pCache = pCache; 269 pPage->pgno = pgno; 270 } 271 assert( pPage->pCache==pCache ); 272 assert( pPage->pgno==pgno ); 273 assert( pPage->pExtra==(void *)&pPage[1] ); 274 275 if( 0==pPage->nRef ){ 276 pCache->nRef++; 277 } 278 pPage->nRef++; 279 if( pgno==1 ){ 280 pCache->pPage1 = pPage; 281 } 282 } 283 *ppPage = pPage; 284 return (pPage==0 && eCreate) ? SQLITE_NOMEM : SQLITE_OK; 285 } 286 287 /* 288 ** Decrement the reference count on a page. If the page is clean and the 289 ** reference count drops to 0, then it is made elible for recycling. 290 */ 291 void sqlite3PcacheRelease(PgHdr *p){ 292 assert( p->nRef>0 ); 293 p->nRef--; 294 if( p->nRef==0 ){ 295 PCache *pCache = p->pCache; 296 pCache->nRef--; 297 if( (p->flags&PGHDR_DIRTY)==0 ){ 298 pcacheUnpin(p); 299 }else{ 300 /* Move the page to the head of the dirty list. */ 301 pcacheRemoveFromDirtyList(p); 302 pcacheAddToDirtyList(p); 303 } 304 } 305 } 306 307 /* 308 ** Increase the reference count of a supplied page by 1. 309 */ 310 void sqlite3PcacheRef(PgHdr *p){ 311 assert(p->nRef>0); 312 p->nRef++; 313 } 314 315 /* 316 ** Drop a page from the cache. There must be exactly one reference to the 317 ** page. This function deletes that reference, so after it returns the 318 ** page pointed to by p is invalid. 319 */ 320 void sqlite3PcacheDrop(PgHdr *p){ 321 PCache *pCache; 322 assert( p->nRef==1 ); 323 if( p->flags&PGHDR_DIRTY ){ 324 pcacheRemoveFromDirtyList(p); 325 } 326 pCache = p->pCache; 327 pCache->nRef--; 328 if( p->pgno==1 ){ 329 pCache->pPage1 = 0; 330 } 331 sqlite3GlobalConfig.pcache.xUnpin(pCache->pCache, p, 1); 332 } 333 334 /* 335 ** Make sure the page is marked as dirty. If it isn't dirty already, 336 ** make it so. 337 */ 338 void sqlite3PcacheMakeDirty(PgHdr *p){ 339 p->flags &= ~PGHDR_DONT_WRITE; 340 assert( p->nRef>0 ); 341 if( 0==(p->flags & PGHDR_DIRTY) ){ 342 p->flags |= PGHDR_DIRTY; 343 pcacheAddToDirtyList( p); 344 } 345 } 346 347 /* 348 ** Make sure the page is marked as clean. If it isn't clean already, 349 ** make it so. 350 */ 351 void sqlite3PcacheMakeClean(PgHdr *p){ 352 if( (p->flags & PGHDR_DIRTY) ){ 353 pcacheRemoveFromDirtyList(p); 354 p->flags &= ~(PGHDR_DIRTY|PGHDR_NEED_SYNC); 355 if( p->nRef==0 ){ 356 pcacheUnpin(p); 357 } 358 } 359 } 360 361 /* 362 ** Make every page in the cache clean. 363 */ 364 void sqlite3PcacheCleanAll(PCache *pCache){ 365 PgHdr *p; 366 while( (p = pCache->pDirty)!=0 ){ 367 sqlite3PcacheMakeClean(p); 368 } 369 } 370 371 /* 372 ** Clear the PGHDR_NEED_SYNC flag from all dirty pages. 373 */ 374 void sqlite3PcacheClearSyncFlags(PCache *pCache){ 375 PgHdr *p; 376 for(p=pCache->pDirty; p; p=p->pDirtyNext){ 377 p->flags &= ~PGHDR_NEED_SYNC; 378 } 379 pCache->pSynced = pCache->pDirtyTail; 380 } 381 382 /* 383 ** Change the page number of page p to newPgno. 384 */ 385 void sqlite3PcacheMove(PgHdr *p, Pgno newPgno){ 386 PCache *pCache = p->pCache; 387 assert( p->nRef>0 ); 388 assert( newPgno>0 ); 389 sqlite3GlobalConfig.pcache.xRekey(pCache->pCache, p, p->pgno, newPgno); 390 p->pgno = newPgno; 391 if( (p->flags&PGHDR_DIRTY) && (p->flags&PGHDR_NEED_SYNC) ){ 392 pcacheRemoveFromDirtyList(p); 393 pcacheAddToDirtyList(p); 394 } 395 } 396 397 /* 398 ** Drop every cache entry whose page number is greater than "pgno". The 399 ** caller must ensure that there are no outstanding references to any pages 400 ** other than page 1 with a page number greater than pgno. 401 ** 402 ** If there is a reference to page 1 and the pgno parameter passed to this 403 ** function is 0, then the data area associated with page 1 is zeroed, but 404 ** the page object is not dropped. 405 */ 406 void sqlite3PcacheTruncate(PCache *pCache, Pgno pgno){ 407 if( pCache->pCache ){ 408 PgHdr *p; 409 PgHdr *pNext; 410 for(p=pCache->pDirty; p; p=pNext){ 411 pNext = p->pDirtyNext; 412 if( p->pgno>pgno ){ 413 assert( p->flags&PGHDR_DIRTY ); 414 sqlite3PcacheMakeClean(p); 415 } 416 } 417 if( pgno==0 && pCache->pPage1 ){ 418 memset(pCache->pPage1->pData, 0, pCache->szPage); 419 pgno = 1; 420 } 421 sqlite3GlobalConfig.pcache.xTruncate(pCache->pCache, pgno+1); 422 } 423 } 424 425 /* 426 ** Close a cache. 427 */ 428 void sqlite3PcacheClose(PCache *pCache){ 429 if( pCache->pCache ){ 430 sqlite3GlobalConfig.pcache.xDestroy(pCache->pCache); 431 } 432 } 433 434 /* 435 ** Discard the contents of the cache. 436 */ 437 void sqlite3PcacheClear(PCache *pCache){ 438 sqlite3PcacheTruncate(pCache, 0); 439 } 440 441 /* 442 ** Merge two lists of pages connected by pDirty and in pgno order. 443 ** Do not both fixing the pDirtyPrev pointers. 444 */ 445 static PgHdr *pcacheMergeDirtyList(PgHdr *pA, PgHdr *pB){ 446 PgHdr result, *pTail; 447 pTail = &result; 448 while( pA && pB ){ 449 if( pA->pgno<pB->pgno ){ 450 pTail->pDirty = pA; 451 pTail = pA; 452 pA = pA->pDirty; 453 }else{ 454 pTail->pDirty = pB; 455 pTail = pB; 456 pB = pB->pDirty; 457 } 458 } 459 if( pA ){ 460 pTail->pDirty = pA; 461 }else if( pB ){ 462 pTail->pDirty = pB; 463 }else{ 464 pTail->pDirty = 0; 465 } 466 return result.pDirty; 467 } 468 469 /* 470 ** Sort the list of pages in accending order by pgno. Pages are 471 ** connected by pDirty pointers. The pDirtyPrev pointers are 472 ** corrupted by this sort. 473 ** 474 ** Since there cannot be more than 2^31 distinct pages in a database, 475 ** there cannot be more than 31 buckets required by the merge sorter. 476 ** One extra bucket is added to catch overflow in case something 477 ** ever changes to make the previous sentence incorrect. 478 */ 479 #define N_SORT_BUCKET 32 480 static PgHdr *pcacheSortDirtyList(PgHdr *pIn){ 481 PgHdr *a[N_SORT_BUCKET], *p; 482 int i; 483 memset(a, 0, sizeof(a)); 484 while( pIn ){ 485 p = pIn; 486 pIn = p->pDirty; 487 p->pDirty = 0; 488 for(i=0; ALWAYS(i<N_SORT_BUCKET-1); i++){ 489 if( a[i]==0 ){ 490 a[i] = p; 491 break; 492 }else{ 493 p = pcacheMergeDirtyList(a[i], p); 494 a[i] = 0; 495 } 496 } 497 if( NEVER(i==N_SORT_BUCKET-1) ){ 498 /* To get here, there need to be 2^(N_SORT_BUCKET) elements in 499 ** the input list. But that is impossible. 500 */ 501 a[i] = pcacheMergeDirtyList(a[i], p); 502 } 503 } 504 p = a[0]; 505 for(i=1; i<N_SORT_BUCKET; i++){ 506 p = pcacheMergeDirtyList(p, a[i]); 507 } 508 return p; 509 } 510 511 /* 512 ** Return a list of all dirty pages in the cache, sorted by page number. 513 */ 514 PgHdr *sqlite3PcacheDirtyList(PCache *pCache){ 515 PgHdr *p; 516 for(p=pCache->pDirty; p; p=p->pDirtyNext){ 517 p->pDirty = p->pDirtyNext; 518 } 519 return pcacheSortDirtyList(pCache->pDirty); 520 } 521 522 /* 523 ** Return the total number of referenced pages held by the cache. 524 */ 525 int sqlite3PcacheRefCount(PCache *pCache){ 526 return pCache->nRef; 527 } 528 529 /* 530 ** Return the number of references to the page supplied as an argument. 531 */ 532 int sqlite3PcachePageRefcount(PgHdr *p){ 533 return p->nRef; 534 } 535 536 /* 537 ** Return the total number of pages in the cache. 538 */ 539 int sqlite3PcachePagecount(PCache *pCache){ 540 int nPage = 0; 541 if( pCache->pCache ){ 542 nPage = sqlite3GlobalConfig.pcache.xPagecount(pCache->pCache); 543 } 544 return nPage; 545 } 546 547 #ifdef SQLITE_TEST 548 /* 549 ** Get the suggested cache-size value. 550 */ 551 int sqlite3PcacheGetCachesize(PCache *pCache){ 552 return pCache->nMax; 553 } 554 #endif 555 556 /* 557 ** Set the suggested cache-size value. 558 */ 559 void sqlite3PcacheSetCachesize(PCache *pCache, int mxPage){ 560 pCache->nMax = mxPage; 561 if( pCache->pCache ){ 562 sqlite3GlobalConfig.pcache.xCachesize(pCache->pCache, mxPage); 563 } 564 } 565 566 #ifdef SQLITE_CHECK_PAGES 567 /* 568 ** For all dirty pages currently in the cache, invoke the specified 569 ** callback. This is only used if the SQLITE_CHECK_PAGES macro is 570 ** defined. 571 */ 572 void sqlite3PcacheIterateDirty(PCache *pCache, void (*xIter)(PgHdr *)){ 573 PgHdr *pDirty; 574 for(pDirty=pCache->pDirty; pDirty; pDirty=pDirty->pDirtyNext){ 575 xIter(pDirty); 576 } 577 } 578 #endif 579