blob: de332cba02d1ae6ad207b7acd7c4accb53fae8b5 [file] [log] [blame]
drhed7c8552001-04-11 14:29:21 +00001/*
drhb19a2bc2001-09-16 00:13:26 +00002** 2001 September 15
drhed7c8552001-04-11 14:29:21 +00003**
drhb19a2bc2001-09-16 00:13:26 +00004** The author disclaims copyright to this source code. In place of
5** a legal notice, here is a blessing:
drhed7c8552001-04-11 14:29:21 +00006**
drhb19a2bc2001-09-16 00:13:26 +00007** May you do good and not evil.
8** May you find forgiveness for yourself and forgive others.
9** May you share freely, never taking more than you give.
drhed7c8552001-04-11 14:29:21 +000010**
11*************************************************************************
drhb19a2bc2001-09-16 00:13:26 +000012** This is the implementation of the page cache subsystem or "pager".
drhed7c8552001-04-11 14:29:21 +000013**
drhb19a2bc2001-09-16 00:13:26 +000014** The pager is used to access a database disk file. It implements
15** atomic commit and rollback through the use of a journal file that
16** is separate from the database file. The pager also implements file
17** locking to prevent two processes from writing the same database
18** file simultaneously, or one process from reading the database while
19** another is writing.
drhed7c8552001-04-11 14:29:21 +000020**
drh603240c2002-03-05 01:11:12 +000021** @(#) $Id: pager.c,v 1.42 2002/03/05 01:11:14 drh Exp $
drhed7c8552001-04-11 14:29:21 +000022*/
drhd9b02572001-04-15 00:37:09 +000023#include "sqliteInt.h"
drhed7c8552001-04-11 14:29:21 +000024#include "pager.h"
drh8cfbf082001-09-19 13:22:39 +000025#include "os.h"
drhed7c8552001-04-11 14:29:21 +000026#include <assert.h>
drhd9b02572001-04-15 00:37:09 +000027#include <string.h>
drhed7c8552001-04-11 14:29:21 +000028
/*
** The page cache as a whole is always in exactly one of these states:
**
**   SQLITE_UNLOCK      The page cache is neither reading nor writing
**                      the database file.  No data is held in memory.
**                      This is the initial state.
**
**   SQLITE_READLOCK    The page cache is reading the database.
**                      Writing is not permitted.  Several readers may
**                      access the same database file at once.
**
**   SQLITE_WRITELOCK   The page cache is writing the database.
**                      Access is exclusive: no other process or thread
**                      may read or write while one process is writing.
**
** The page cache comes up in SQLITE_UNLOCK.  The first
** sqlitepager_get() moves it to SQLITE_READLOCK.  Once every page has
** been released with sqlitepager_unref() the state drops back to
** SQLITE_UNLOCK.  The first request to write a page moves the state to
** SQLITE_WRITELOCK.  (A page can only be written while it is
** outstanding, so the pager is always in SQLITE_READLOCK before it
** reaches SQLITE_WRITELOCK.)  Commit and sqlitepager_rollback() move
** the state from SQLITE_WRITELOCK back to SQLITE_READLOCK.
*/
#define SQLITE_UNLOCK      0
#define SQLITE_READLOCK    1
#define SQLITE_WRITELOCK   2
62
drhd9b02572001-04-15 00:37:09 +000063
drhed7c8552001-04-11 14:29:21 +000064/*
65** Each in-memory image of a page begins with the following header.
drhbd03cae2001-06-02 02:40:57 +000066** This header is only visible to this pager module. The client
67** code that calls pager sees only the data that follows the header.
drhed7c8552001-04-11 14:29:21 +000068*/
drhd9b02572001-04-15 00:37:09 +000069typedef struct PgHdr PgHdr;
drhed7c8552001-04-11 14:29:21 +000070struct PgHdr {
71 Pager *pPager; /* The pager to which this page belongs */
72 Pgno pgno; /* The page number for this page */
drh69688d52001-04-14 16:38:23 +000073 PgHdr *pNextHash, *pPrevHash; /* Hash collision chain for PgHdr.pgno */
drhed7c8552001-04-11 14:29:21 +000074 int nRef; /* Number of users of this page */
drhd9b02572001-04-15 00:37:09 +000075 PgHdr *pNextFree, *pPrevFree; /* Freelist of pages where nRef==0 */
76 PgHdr *pNextAll, *pPrevAll; /* A list of all pages */
drhed7c8552001-04-11 14:29:21 +000077 char inJournal; /* TRUE if has been written to journal */
drhfa86c412002-02-02 15:01:15 +000078 char inCkpt; /* TRUE if written to the checkpoint journal */
drhed7c8552001-04-11 14:29:21 +000079 char dirty; /* TRUE if we need to write back changes */
drh69688d52001-04-14 16:38:23 +000080 /* SQLITE_PAGE_SIZE bytes of page data follow this header */
drh7e3b0a02001-04-28 16:52:40 +000081 /* Pager.nExtra bytes of local data follow the page data */
drhed7c8552001-04-11 14:29:21 +000082};
83
/*
** Conversions between a page header pointer and the memory that
** follows it:
**
**   PGHDR_TO_DATA(P)    header pointer -> page data just past the header
**   DATA_TO_PGHDR(D)    page data pointer -> header just before the data
**   PGHDR_TO_EXTRA(P)   header pointer -> extra area that starts
**                       SQLITE_PAGE_SIZE bytes past the page data
*/
#define PGHDR_TO_DATA(P)   ((void*)((P)+1))
#define DATA_TO_PGHDR(D)   (((PgHdr*)(D))-1)
#define PGHDR_TO_EXTRA(P)  ((void*)(((char*)((P)+1))+SQLITE_PAGE_SIZE))
drhed7c8552001-04-11 14:29:21 +000091
/*
** Number of buckets in the hash table that locates in-memory pages
** by page number.  Knuth says this should be a prime number.
*/
#define N_PG_HASH 2003
drhed7c8552001-04-11 14:29:21 +000097
98/*
99** A open page cache is an instance of the following structure.
100*/
101struct Pager {
102 char *zFilename; /* Name of the database file */
103 char *zJournal; /* Name of the journal file */
drh8cfbf082001-09-19 13:22:39 +0000104 OsFile fd, jfd; /* File descriptors for database and journal */
drhfa86c412002-02-02 15:01:15 +0000105 OsFile cpfd; /* File descriptor for the checkpoint journal */
drhed7c8552001-04-11 14:29:21 +0000106 int dbSize; /* Number of pages in the file */
drh69688d52001-04-14 16:38:23 +0000107 int origDbSize; /* dbSize before the current change */
drhfa86c412002-02-02 15:01:15 +0000108 int ckptSize, ckptJSize; /* Size of database and journal at ckpt_begin() */
drh7e3b0a02001-04-28 16:52:40 +0000109 int nExtra; /* Add this many bytes to each in-memory page */
drh72f82862001-05-24 21:06:34 +0000110 void (*xDestructor)(void*); /* Call this routine when freeing pages */
drhed7c8552001-04-11 14:29:21 +0000111 int nPage; /* Total number of in-memory pages */
drhd9b02572001-04-15 00:37:09 +0000112 int nRef; /* Number of in-memory pages with PgHdr.nRef>0 */
drhed7c8552001-04-11 14:29:21 +0000113 int mxPage; /* Maximum number of pages to hold in cache */
drhd9b02572001-04-15 00:37:09 +0000114 int nHit, nMiss, nOvfl; /* Cache hits, missing, and LRU overflows */
drh603240c2002-03-05 01:11:12 +0000115 u8 journalOpen; /* True if journal file descriptors is valid */
116 u8 ckptOpen; /* True if the checkpoint journal is open */
117 u8 noSync; /* Do not sync the journal if true */
118 u8 state; /* SQLITE_UNLOCK, _READLOCK or _WRITELOCK */
119 u8 errMask; /* One of several kinds of errors */
120 u8 tempFile; /* zFilename is a temporary file */
121 u8 readOnly; /* True for a read-only database */
122 u8 needSync; /* True if an fsync() is needed on the journal */
123 u8 *aInJournal; /* One bit for each page in the database file */
124 u8 *aInCkpt; /* One bit for each page in the database */
drhed7c8552001-04-11 14:29:21 +0000125 PgHdr *pFirst, *pLast; /* List of free pages */
drhd9b02572001-04-15 00:37:09 +0000126 PgHdr *pAll; /* List of all pages */
drhed7c8552001-04-11 14:29:21 +0000127 PgHdr *aHash[N_PG_HASH]; /* Hash table to map page number of PgHdr */
drhd9b02572001-04-15 00:37:09 +0000128};
129
/*
** Bits that can be set in Pager.errMask.  Several bits may be set at
** once; pager_errcode() chooses the result code that is reported.
*/
#define PAGER_ERR_FULL     0x01  /* a write() failed */
#define PAGER_ERR_MEM      0x02  /* malloc() failed */
#define PAGER_ERR_LOCK     0x04  /* error in the locking protocol */
#define PAGER_ERR_CORRUPT  0x08  /* database or journal corruption */
#define PAGER_ERR_DISK     0x10  /* general disk I/O error - bad hard drive? */
drhd9b02572001-04-15 00:37:09 +0000138
/*
** The journal file contains page records in the following format.
** Records are read from the journal directly into this structure, so
** its layout is part of the journal file format.
*/
typedef struct PageRecord PageRecord;
struct PageRecord {
  Pgno pgno;                      /* The page number */
  char aData[SQLITE_PAGE_SIZE];   /* Original data for page pgno */
};
148
/*
** Journal files begin with the following magic string.  The bytes
** were obtained from /dev/random and serve only as a sanity check.
*/
static const unsigned char aJournalMagic[] = {
  0xd9, 0xd5, 0x05, 0xf9, 0x20, 0xa1, 0x63, 0xd4,
};
156
/*
** Hash a page number: map page number PN to a bucket index in the
** range 0..N_PG_HASH-1.
*/
#define pager_hash(PN) ((PN)%N_PG_HASH)
drhed7c8552001-04-11 14:29:21 +0000161
/*
** Reference count tracking, compiled in only when SQLITE_TEST is set.
**
** When pager_refinfo_enable is non-zero, REFINFO(X) prints the page
** number, the address of the page data and the current reference
** count of page X.  Without SQLITE_TEST, REFINFO(X) expands to
** nothing.
*/
#if SQLITE_TEST
  int pager_refinfo_enable = 0;
  static void pager_refinfo(PgHdr *p){
    static int cnt = 0;
    if( !pager_refinfo_enable ) return;
    /* Print the address with %p.  Casting the pointer to int and
    ** printing it with %x truncates the address wherever pointers
    ** are wider than int. */
    printf(
       "REFCNT: %4d addr=%p nRef=%d\n",
       (int)p->pgno, PGHDR_TO_DATA(p), p->nRef
    );
    cnt++;   /* Something to set a breakpoint on */
  }
# define REFINFO(X)  pager_refinfo(X)
#else
# define REFINFO(X)
#endif
180
181/*
drhd9b02572001-04-15 00:37:09 +0000182** Convert the bits in the pPager->errMask into an approprate
183** return code.
184*/
185static int pager_errcode(Pager *pPager){
186 int rc = SQLITE_OK;
187 if( pPager->errMask & PAGER_ERR_LOCK ) rc = SQLITE_PROTOCOL;
drh81a20f22001-10-12 17:30:04 +0000188 if( pPager->errMask & PAGER_ERR_DISK ) rc = SQLITE_IOERR;
drhd9b02572001-04-15 00:37:09 +0000189 if( pPager->errMask & PAGER_ERR_FULL ) rc = SQLITE_FULL;
190 if( pPager->errMask & PAGER_ERR_MEM ) rc = SQLITE_NOMEM;
191 if( pPager->errMask & PAGER_ERR_CORRUPT ) rc = SQLITE_CORRUPT;
192 return rc;
drhed7c8552001-04-11 14:29:21 +0000193}
194
195/*
196** Find a page in the hash table given its page number. Return
197** a pointer to the page or NULL if not found.
198*/
drhd9b02572001-04-15 00:37:09 +0000199static PgHdr *pager_lookup(Pager *pPager, Pgno pgno){
drhed7c8552001-04-11 14:29:21 +0000200 PgHdr *p = pPager->aHash[pgno % N_PG_HASH];
201 while( p && p->pgno!=pgno ){
202 p = p->pNextHash;
203 }
204 return p;
205}
206
207/*
208** Unlock the database and clear the in-memory cache. This routine
209** sets the state of the pager back to what it was when it was first
210** opened. Any outstanding pages are invalidated and subsequent attempts
211** to access those pages will likely result in a coredump.
212*/
drhd9b02572001-04-15 00:37:09 +0000213static void pager_reset(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000214 PgHdr *pPg, *pNext;
drhd9b02572001-04-15 00:37:09 +0000215 for(pPg=pPager->pAll; pPg; pPg=pNext){
216 pNext = pPg->pNextAll;
217 sqliteFree(pPg);
drhed7c8552001-04-11 14:29:21 +0000218 }
219 pPager->pFirst = 0;
drhd9b02572001-04-15 00:37:09 +0000220 pPager->pLast = 0;
221 pPager->pAll = 0;
drhed7c8552001-04-11 14:29:21 +0000222 memset(pPager->aHash, 0, sizeof(pPager->aHash));
223 pPager->nPage = 0;
drhfa86c412002-02-02 15:01:15 +0000224 if( pPager->state>=SQLITE_WRITELOCK ){
drhd9b02572001-04-15 00:37:09 +0000225 sqlitepager_rollback(pPager);
drhed7c8552001-04-11 14:29:21 +0000226 }
drha7fcb052001-12-14 15:09:55 +0000227 sqliteOsUnlock(&pPager->fd);
drhed7c8552001-04-11 14:29:21 +0000228 pPager->state = SQLITE_UNLOCK;
drhd9b02572001-04-15 00:37:09 +0000229 pPager->dbSize = -1;
drhed7c8552001-04-11 14:29:21 +0000230 pPager->nRef = 0;
drh8cfbf082001-09-19 13:22:39 +0000231 assert( pPager->journalOpen==0 );
drhed7c8552001-04-11 14:29:21 +0000232}
233
234/*
235** When this routine is called, the pager has the journal file open and
236** a write lock on the database. This routine releases the database
237** write lock and acquires a read lock in its place. The journal file
238** is deleted and closed.
drhed7c8552001-04-11 14:29:21 +0000239*/
drhd9b02572001-04-15 00:37:09 +0000240static int pager_unwritelock(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000241 int rc;
drhd9b02572001-04-15 00:37:09 +0000242 PgHdr *pPg;
drhfa86c412002-02-02 15:01:15 +0000243 if( pPager->state<SQLITE_WRITELOCK ) return SQLITE_OK;
drh663fc632002-02-02 18:49:19 +0000244 sqlitepager_ckpt_commit(pPager);
drha7fcb052001-12-14 15:09:55 +0000245 sqliteOsClose(&pPager->jfd);
drh8cfbf082001-09-19 13:22:39 +0000246 pPager->journalOpen = 0;
247 sqliteOsDelete(pPager->zJournal);
drha7fcb052001-12-14 15:09:55 +0000248 rc = sqliteOsReadLock(&pPager->fd);
249 assert( rc==SQLITE_OK );
drh6019e162001-07-02 17:51:45 +0000250 sqliteFree( pPager->aInJournal );
251 pPager->aInJournal = 0;
drhd9b02572001-04-15 00:37:09 +0000252 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
253 pPg->inJournal = 0;
254 pPg->dirty = 0;
255 }
drha7fcb052001-12-14 15:09:55 +0000256 pPager->state = SQLITE_READLOCK;
drhed7c8552001-04-11 14:29:21 +0000257 return rc;
258}
259
drhed7c8552001-04-11 14:29:21 +0000260/*
drhfa86c412002-02-02 15:01:15 +0000261** Read a single page from the journal file opened on file descriptor
262** jfd. Playback this one page.
263*/
264static int pager_playback_one_page(Pager *pPager, OsFile *jfd){
265 int rc;
266 PgHdr *pPg; /* An existing page in the cache */
267 PageRecord pgRec;
268
drh663fc632002-02-02 18:49:19 +0000269 rc = sqliteOsRead(jfd, &pgRec, sizeof(pgRec));
drhfa86c412002-02-02 15:01:15 +0000270 if( rc!=SQLITE_OK ) return rc;
271
272 /* Sanity checking on the page */
273 if( pgRec.pgno>pPager->dbSize || pgRec.pgno==0 ) return SQLITE_CORRUPT;
274
275 /* Playback the page. Update the in-memory copy of the page
276 ** at the same time, if there is one.
277 */
278 pPg = pager_lookup(pPager, pgRec.pgno);
279 if( pPg ){
280 memcpy(PGHDR_TO_DATA(pPg), pgRec.aData, SQLITE_PAGE_SIZE);
281 memset(PGHDR_TO_EXTRA(pPg), 0, pPager->nExtra);
282 }
283 rc = sqliteOsSeek(&pPager->fd, (pgRec.pgno-1)*SQLITE_PAGE_SIZE);
284 if( rc==SQLITE_OK ){
285 rc = sqliteOsWrite(&pPager->fd, pgRec.aData, SQLITE_PAGE_SIZE);
286 }
287 return rc;
288}
289
290/*
drhed7c8552001-04-11 14:29:21 +0000291** Playback the journal and thus restore the database file to
292** the state it was in before we started making changes.
293**
drhd9b02572001-04-15 00:37:09 +0000294** The journal file format is as follows: There is an initial
295** file-type string for sanity checking. Then there is a single
296** Pgno number which is the number of pages in the database before
297** changes were made. The database is truncated to this size.
drh306dc212001-05-21 13:45:10 +0000298** Next come zero or more page records where each page record
299** consists of a Pgno and SQLITE_PAGE_SIZE bytes of data. See
300** the PageRecord structure for details.
drhed7c8552001-04-11 14:29:21 +0000301**
drhd9b02572001-04-15 00:37:09 +0000302** If the file opened as the journal file is not a well-formed
303** journal file (as determined by looking at the magic number
304** at the beginning) then this routine returns SQLITE_PROTOCOL.
305** If any other errors occur during playback, the database will
306** likely be corrupted, so the PAGER_ERR_CORRUPT bit is set in
307** pPager->errMask and SQLITE_CORRUPT is returned. If it all
308** works, then this routine returns SQLITE_OK.
drhed7c8552001-04-11 14:29:21 +0000309*/
drhd9b02572001-04-15 00:37:09 +0000310static int pager_playback(Pager *pPager){
311 int nRec; /* Number of Records */
312 int i; /* Loop counter */
313 Pgno mxPg = 0; /* Size of the original file in pages */
drhd9b02572001-04-15 00:37:09 +0000314 unsigned char aMagic[sizeof(aJournalMagic)];
drhed7c8552001-04-11 14:29:21 +0000315 int rc;
316
drhc3a64ba2001-11-22 00:01:27 +0000317 /* Figure out how many records are in the journal. Abort early if
318 ** the journal is empty.
drhed7c8552001-04-11 14:29:21 +0000319 */
drh8cfbf082001-09-19 13:22:39 +0000320 assert( pPager->journalOpen );
drha7fcb052001-12-14 15:09:55 +0000321 sqliteOsSeek(&pPager->jfd, 0);
322 rc = sqliteOsFileSize(&pPager->jfd, &nRec);
drhc3a64ba2001-11-22 00:01:27 +0000323 if( rc!=SQLITE_OK ){
324 goto end_playback;
325 }
326 nRec = (nRec - (sizeof(aMagic)+sizeof(Pgno))) / sizeof(PageRecord);
327 if( nRec<=0 ){
328 goto end_playback;
329 }
330
331 /* Read the beginning of the journal and truncate the
332 ** database file back to its original size.
333 */
drha7fcb052001-12-14 15:09:55 +0000334 rc = sqliteOsRead(&pPager->jfd, aMagic, sizeof(aMagic));
drhd9b02572001-04-15 00:37:09 +0000335 if( rc!=SQLITE_OK || memcmp(aMagic,aJournalMagic,sizeof(aMagic))!=0 ){
drh81a20f22001-10-12 17:30:04 +0000336 rc = SQLITE_PROTOCOL;
337 goto end_playback;
drhd9b02572001-04-15 00:37:09 +0000338 }
drha7fcb052001-12-14 15:09:55 +0000339 rc = sqliteOsRead(&pPager->jfd, &mxPg, sizeof(mxPg));
drhd9b02572001-04-15 00:37:09 +0000340 if( rc!=SQLITE_OK ){
drh81a20f22001-10-12 17:30:04 +0000341 goto end_playback;
drhd9b02572001-04-15 00:37:09 +0000342 }
drha7fcb052001-12-14 15:09:55 +0000343 rc = sqliteOsTruncate(&pPager->fd, mxPg*SQLITE_PAGE_SIZE);
drh81a20f22001-10-12 17:30:04 +0000344 if( rc!=SQLITE_OK ){
345 goto end_playback;
346 }
drhd9b02572001-04-15 00:37:09 +0000347 pPager->dbSize = mxPg;
348
drhfa86c412002-02-02 15:01:15 +0000349 /* Copy original pages out of the journal and back into the database file.
drhed7c8552001-04-11 14:29:21 +0000350 */
drhd9b02572001-04-15 00:37:09 +0000351 for(i=nRec-1; i>=0; i--){
drhfa86c412002-02-02 15:01:15 +0000352 rc = pager_playback_one_page(pPager, &pPager->jfd);
drhd9b02572001-04-15 00:37:09 +0000353 if( rc!=SQLITE_OK ) break;
drhed7c8552001-04-11 14:29:21 +0000354 }
drh81a20f22001-10-12 17:30:04 +0000355
356end_playback:
drhd9b02572001-04-15 00:37:09 +0000357 if( rc!=SQLITE_OK ){
358 pager_unwritelock(pPager);
359 pPager->errMask |= PAGER_ERR_CORRUPT;
360 rc = SQLITE_CORRUPT;
361 }else{
362 rc = pager_unwritelock(pPager);
drhed7c8552001-04-11 14:29:21 +0000363 }
drhd9b02572001-04-15 00:37:09 +0000364 return rc;
drhed7c8552001-04-11 14:29:21 +0000365}
366
367/*
drhfa86c412002-02-02 15:01:15 +0000368** Playback the checkpoint journal.
369**
370** This is similar to playing back the transaction journal but with
371** a few extra twists.
372**
drh663fc632002-02-02 18:49:19 +0000373** (1) The number of pages in the database file at the start of
374** the checkpoint is stored in pPager->ckptSize, not in the
375** journal file itself.
drhfa86c412002-02-02 15:01:15 +0000376**
377** (2) In addition to playing back the checkpoint journal, also
378** playback all pages of the transaction journal beginning
379** at offset pPager->ckptJSize.
380*/
381static int pager_ckpt_playback(Pager *pPager){
382 int nRec; /* Number of Records */
383 int i; /* Loop counter */
384 int rc;
385
386 /* Truncate the database back to its original size.
387 */
drh663fc632002-02-02 18:49:19 +0000388 rc = sqliteOsTruncate(&pPager->fd, pPager->ckptSize*SQLITE_PAGE_SIZE);
drhfa86c412002-02-02 15:01:15 +0000389 pPager->dbSize = pPager->ckptSize;
390
391 /* Figure out how many records are in the checkpoint journal.
392 */
393 assert( pPager->ckptOpen && pPager->journalOpen );
394 sqliteOsSeek(&pPager->cpfd, 0);
395 rc = sqliteOsFileSize(&pPager->cpfd, &nRec);
396 if( rc!=SQLITE_OK ){
397 goto end_ckpt_playback;
398 }
399 nRec /= sizeof(PageRecord);
400
401 /* Copy original pages out of the checkpoint journal and back into the
402 ** database file.
403 */
404 for(i=nRec-1; i>=0; i--){
405 rc = pager_playback_one_page(pPager, &pPager->cpfd);
406 if( rc!=SQLITE_OK ) goto end_ckpt_playback;
407 }
408
409 /* Figure out how many pages need to be copied out of the transaction
410 ** journal.
411 */
412 rc = sqliteOsSeek(&pPager->jfd, pPager->ckptJSize);
413 if( rc!=SQLITE_OK ){
414 goto end_ckpt_playback;
415 }
416 rc = sqliteOsFileSize(&pPager->jfd, &nRec);
417 if( rc!=SQLITE_OK ){
418 goto end_ckpt_playback;
419 }
420 nRec = (nRec - pPager->ckptJSize)/sizeof(PageRecord);
421 for(i=nRec-1; i>=0; i--){
422 rc = pager_playback_one_page(pPager, &pPager->jfd);
423 if( rc!=SQLITE_OK ) goto end_ckpt_playback;
424 }
425
426
427end_ckpt_playback:
drhfa86c412002-02-02 15:01:15 +0000428 if( rc!=SQLITE_OK ){
drhfa86c412002-02-02 15:01:15 +0000429 pPager->errMask |= PAGER_ERR_CORRUPT;
430 rc = SQLITE_CORRUPT;
drhfa86c412002-02-02 15:01:15 +0000431 }
432 return rc;
433}
434
435/*
drhf57b14a2001-09-14 18:54:08 +0000436** Change the maximum number of in-memory pages that are allowed.
437*/
438void sqlitepager_set_cachesize(Pager *pPager, int mxPage){
drh603240c2002-03-05 01:11:12 +0000439 if( mxPage>=0 ){
440 pPager->noSync = 0;
441 }else{
442 pPager->noSync = 1;
443 mxPage = -mxPage;
444 }
drhf57b14a2001-09-14 18:54:08 +0000445 if( mxPage>10 ){
446 pPager->mxPage = mxPage;
447 }
448}
449
450/*
drhfa86c412002-02-02 15:01:15 +0000451** Open a temporary file. Write the name of the file into zName
452** (zName must be at least SQLITE_TEMPNAME_SIZE bytes long.) Write
453** the file descriptor into *fd. Return SQLITE_OK on success or some
454** other error code if we fail.
455**
456** The OS will automatically delete the temporary file when it is
457** closed.
458*/
459static int sqlitepager_opentemp(char *zFile, OsFile *fd){
460 int cnt = 8;
461 int rc;
462 do{
463 cnt--;
464 sqliteOsTempFileName(zFile);
465 rc = sqliteOsOpenExclusive(zFile, fd, 1);
466 }while( cnt>0 && rc!=SQLITE_OK );
467 return rc;
468}
469
470/*
drhed7c8552001-04-11 14:29:21 +0000471** Create a new page cache and put a pointer to the page cache in *ppPager.
drh5e00f6c2001-09-13 13:46:56 +0000472** The file to be cached need not exist. The file is not locked until
drhd9b02572001-04-15 00:37:09 +0000473** the first call to sqlitepager_get() and is only held open until the
474** last page is released using sqlitepager_unref().
drh382c0242001-10-06 16:33:02 +0000475**
drh6446c4d2001-12-15 14:22:18 +0000476** If zFilename is NULL then a randomly-named temporary file is created
477** and used as the file to be cached. The file will be deleted
478** automatically when it is closed.
drhed7c8552001-04-11 14:29:21 +0000479*/
drh7e3b0a02001-04-28 16:52:40 +0000480int sqlitepager_open(
481 Pager **ppPager, /* Return the Pager structure here */
482 const char *zFilename, /* Name of the database file to open */
483 int mxPage, /* Max number of in-memory cache pages */
484 int nExtra /* Extra bytes append to each in-memory page */
485){
drhed7c8552001-04-11 14:29:21 +0000486 Pager *pPager;
487 int nameLen;
drh8cfbf082001-09-19 13:22:39 +0000488 OsFile fd;
489 int rc;
drh5e00f6c2001-09-13 13:46:56 +0000490 int tempFile;
491 int readOnly = 0;
drh8cfbf082001-09-19 13:22:39 +0000492 char zTemp[SQLITE_TEMPNAME_SIZE];
drhed7c8552001-04-11 14:29:21 +0000493
drhd9b02572001-04-15 00:37:09 +0000494 *ppPager = 0;
495 if( sqlite_malloc_failed ){
496 return SQLITE_NOMEM;
497 }
drh5e00f6c2001-09-13 13:46:56 +0000498 if( zFilename ){
drh8cfbf082001-09-19 13:22:39 +0000499 rc = sqliteOsOpenReadWrite(zFilename, &fd, &readOnly);
drh5e00f6c2001-09-13 13:46:56 +0000500 tempFile = 0;
501 }else{
drhfa86c412002-02-02 15:01:15 +0000502 rc = sqlitepager_opentemp(zTemp, &fd);
drh5e00f6c2001-09-13 13:46:56 +0000503 zFilename = zTemp;
504 tempFile = 1;
505 }
drh8cfbf082001-09-19 13:22:39 +0000506 if( rc!=SQLITE_OK ){
drhed7c8552001-04-11 14:29:21 +0000507 return SQLITE_CANTOPEN;
508 }
509 nameLen = strlen(zFilename);
510 pPager = sqliteMalloc( sizeof(*pPager) + nameLen*2 + 30 );
drhd9b02572001-04-15 00:37:09 +0000511 if( pPager==0 ){
drha7fcb052001-12-14 15:09:55 +0000512 sqliteOsClose(&fd);
drhd9b02572001-04-15 00:37:09 +0000513 return SQLITE_NOMEM;
514 }
drhed7c8552001-04-11 14:29:21 +0000515 pPager->zFilename = (char*)&pPager[1];
516 pPager->zJournal = &pPager->zFilename[nameLen+1];
517 strcpy(pPager->zFilename, zFilename);
518 strcpy(pPager->zJournal, zFilename);
519 strcpy(&pPager->zJournal[nameLen], "-journal");
520 pPager->fd = fd;
drh8cfbf082001-09-19 13:22:39 +0000521 pPager->journalOpen = 0;
drhfa86c412002-02-02 15:01:15 +0000522 pPager->ckptOpen = 0;
drhed7c8552001-04-11 14:29:21 +0000523 pPager->nRef = 0;
524 pPager->dbSize = -1;
drhfa86c412002-02-02 15:01:15 +0000525 pPager->ckptSize = 0;
526 pPager->ckptJSize = 0;
drhed7c8552001-04-11 14:29:21 +0000527 pPager->nPage = 0;
drhd79caeb2001-04-15 02:27:24 +0000528 pPager->mxPage = mxPage>5 ? mxPage : 10;
drhed7c8552001-04-11 14:29:21 +0000529 pPager->state = SQLITE_UNLOCK;
drhd9b02572001-04-15 00:37:09 +0000530 pPager->errMask = 0;
drh5e00f6c2001-09-13 13:46:56 +0000531 pPager->tempFile = tempFile;
532 pPager->readOnly = readOnly;
drhf57b14a2001-09-14 18:54:08 +0000533 pPager->needSync = 0;
drhed7c8552001-04-11 14:29:21 +0000534 pPager->pFirst = 0;
535 pPager->pLast = 0;
drh7c717f72001-06-24 20:39:41 +0000536 pPager->nExtra = nExtra;
drhed7c8552001-04-11 14:29:21 +0000537 memset(pPager->aHash, 0, sizeof(pPager->aHash));
538 *ppPager = pPager;
539 return SQLITE_OK;
540}
541
/*
** Set the destructor for this pager.  If not NULL, the destructor is
** called when the reference count on a page reaches zero.  The
** destructor can be used to clean up information in the extra segment
** appended to each page.
**
** The destructor is not called as a result of sqlitepager_close().
** Destructors are only called by sqlitepager_unref().
*/
void sqlitepager_set_destructor(Pager *pPager, void (*xDesc)(void*)){
  pPager->xDestructor = xDesc;
}
553
554/*
drh5e00f6c2001-09-13 13:46:56 +0000555** Return the total number of pages in the disk file associated with
556** pPager.
drhed7c8552001-04-11 14:29:21 +0000557*/
drhd9b02572001-04-15 00:37:09 +0000558int sqlitepager_pagecount(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000559 int n;
drhd9b02572001-04-15 00:37:09 +0000560 assert( pPager!=0 );
drhed7c8552001-04-11 14:29:21 +0000561 if( pPager->dbSize>=0 ){
562 return pPager->dbSize;
563 }
drha7fcb052001-12-14 15:09:55 +0000564 if( sqliteOsFileSize(&pPager->fd, &n)!=SQLITE_OK ){
drh81a20f22001-10-12 17:30:04 +0000565 pPager->errMask |= PAGER_ERR_DISK;
drh8cfbf082001-09-19 13:22:39 +0000566 return 0;
drhed7c8552001-04-11 14:29:21 +0000567 }
drh8cfbf082001-09-19 13:22:39 +0000568 n /= SQLITE_PAGE_SIZE;
drhd9b02572001-04-15 00:37:09 +0000569 if( pPager->state!=SQLITE_UNLOCK ){
drhed7c8552001-04-11 14:29:21 +0000570 pPager->dbSize = n;
571 }
572 return n;
573}
574
575/*
576** Shutdown the page cache. Free all memory and close all files.
577**
578** If a transaction was in progress when this routine is called, that
579** transaction is rolled back. All outstanding pages are invalidated
580** and their memory is freed. Any attempt to use a page associated
581** with this page cache after this function returns will likely
582** result in a coredump.
583*/
drhd9b02572001-04-15 00:37:09 +0000584int sqlitepager_close(Pager *pPager){
585 PgHdr *pPg, *pNext;
drhed7c8552001-04-11 14:29:21 +0000586 switch( pPager->state ){
587 case SQLITE_WRITELOCK: {
drhd9b02572001-04-15 00:37:09 +0000588 sqlitepager_rollback(pPager);
drha7fcb052001-12-14 15:09:55 +0000589 sqliteOsUnlock(&pPager->fd);
drh8cfbf082001-09-19 13:22:39 +0000590 assert( pPager->journalOpen==0 );
drhed7c8552001-04-11 14:29:21 +0000591 break;
592 }
593 case SQLITE_READLOCK: {
drha7fcb052001-12-14 15:09:55 +0000594 sqliteOsUnlock(&pPager->fd);
drhed7c8552001-04-11 14:29:21 +0000595 break;
596 }
597 default: {
598 /* Do nothing */
599 break;
600 }
601 }
drhd9b02572001-04-15 00:37:09 +0000602 for(pPg=pPager->pAll; pPg; pPg=pNext){
603 pNext = pPg->pNextAll;
604 sqliteFree(pPg);
drhed7c8552001-04-11 14:29:21 +0000605 }
drha7fcb052001-12-14 15:09:55 +0000606 sqliteOsClose(&pPager->fd);
drh8cfbf082001-09-19 13:22:39 +0000607 assert( pPager->journalOpen==0 );
drh5e00f6c2001-09-13 13:46:56 +0000608 if( pPager->tempFile ){
drhfa86c412002-02-02 15:01:15 +0000609 /* sqliteOsDelete(pPager->zFilename); */
drh5e00f6c2001-09-13 13:46:56 +0000610 }
drhed7c8552001-04-11 14:29:21 +0000611 sqliteFree(pPager);
612 return SQLITE_OK;
613}
614
615/*
drh5e00f6c2001-09-13 13:46:56 +0000616** Return the page number for the given page data.
drhed7c8552001-04-11 14:29:21 +0000617*/
drhd9b02572001-04-15 00:37:09 +0000618Pgno sqlitepager_pagenumber(void *pData){
drhed7c8552001-04-11 14:29:21 +0000619 PgHdr *p = DATA_TO_PGHDR(pData);
620 return p->pgno;
621}
622
623/*
drh7e3b0a02001-04-28 16:52:40 +0000624** Increment the reference count for a page. If the page is
625** currently on the freelist (the reference count is zero) then
626** remove it from the freelist.
627*/
drhdf0b3b02001-06-23 11:36:20 +0000628static void page_ref(PgHdr *pPg){
drh7e3b0a02001-04-28 16:52:40 +0000629 if( pPg->nRef==0 ){
630 /* The page is currently on the freelist. Remove it. */
631 if( pPg->pPrevFree ){
632 pPg->pPrevFree->pNextFree = pPg->pNextFree;
633 }else{
634 pPg->pPager->pFirst = pPg->pNextFree;
635 }
636 if( pPg->pNextFree ){
637 pPg->pNextFree->pPrevFree = pPg->pPrevFree;
638 }else{
639 pPg->pPager->pLast = pPg->pPrevFree;
640 }
641 pPg->pPager->nRef++;
642 }
643 pPg->nRef++;
drhdd793422001-06-28 01:54:48 +0000644 REFINFO(pPg);
drhdf0b3b02001-06-23 11:36:20 +0000645}
646
647/*
648** Increment the reference count for a page. The input pointer is
649** a reference to the page data.
650*/
651int sqlitepager_ref(void *pData){
652 PgHdr *pPg = DATA_TO_PGHDR(pData);
653 page_ref(pPg);
drh8c42ca92001-06-22 19:15:00 +0000654 return SQLITE_OK;
drh7e3b0a02001-04-28 16:52:40 +0000655}
656
657/*
drhb19a2bc2001-09-16 00:13:26 +0000658** Sync the journal and then write all free dirty pages to the database
659** file.
660**
661** Writing all free dirty pages to the database after the sync is a
662** non-obvious optimization. fsync() is an expensive operation so we
drhaaab5722002-02-19 13:39:21 +0000663** want to minimize the number ot times it is called. After an fsync() call,
drh6446c4d2001-12-15 14:22:18 +0000664** we are free to write dirty pages back to the database. It is best
665** to go ahead and write as many dirty pages as possible to minimize
666** the risk of having to do another fsync() later on. Writing dirty
667** free pages in this way was observed to make database operations go
668** up to 10 times faster.
drhfa86c412002-02-02 15:01:15 +0000669**
670** If we are writing to temporary database, there is no need to preserve
671** the integrity of the journal file, so we can save time and skip the
672** fsync().
drh50e5dad2001-09-15 00:57:28 +0000673*/
674static int syncAllPages(Pager *pPager){
675 PgHdr *pPg;
676 int rc = SQLITE_OK;
677 if( pPager->needSync ){
drhfa86c412002-02-02 15:01:15 +0000678 if( !pPager->tempFile ){
679 rc = sqliteOsSync(&pPager->jfd);
680 if( rc!=0 ) return rc;
681 }
drh50e5dad2001-09-15 00:57:28 +0000682 pPager->needSync = 0;
683 }
684 for(pPg=pPager->pFirst; pPg; pPg=pPg->pNextFree){
685 if( pPg->dirty ){
drha7fcb052001-12-14 15:09:55 +0000686 sqliteOsSeek(&pPager->fd, (pPg->pgno-1)*SQLITE_PAGE_SIZE);
687 rc = sqliteOsWrite(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drh50e5dad2001-09-15 00:57:28 +0000688 if( rc!=SQLITE_OK ) break;
689 pPg->dirty = 0;
690 }
691 }
drh81a20f22001-10-12 17:30:04 +0000692 return rc;
drh50e5dad2001-09-15 00:57:28 +0000693}
694
695/*
drhd9b02572001-04-15 00:37:09 +0000696** Acquire a page.
697**
drh58a11682001-11-10 13:51:08 +0000698** A read lock on the disk file is obtained when the first page is acquired.
drh5e00f6c2001-09-13 13:46:56 +0000699** This read lock is dropped when the last page is released.
drhd9b02572001-04-15 00:37:09 +0000700**
drh306dc212001-05-21 13:45:10 +0000701** A _get works for any page number greater than 0. If the database
702** file is smaller than the requested page, then no actual disk
703** read occurs and the memory image of the page is initialized to
704** all zeros. The extra data appended to a page is always initialized
705** to zeros the first time a page is loaded into memory.
706**
drhd9b02572001-04-15 00:37:09 +0000707** The acquisition might fail for several reasons. In all cases,
708** an appropriate error code is returned and *ppPage is set to NULL.
drh7e3b0a02001-04-28 16:52:40 +0000709**
710** See also sqlitepager_lookup(). Both this routine and _lookup() attempt
711** to find a page in the in-memory cache first. If the page is not already
drh5e00f6c2001-09-13 13:46:56 +0000712** in memory, this routine goes to disk to read it in whereas _lookup()
drh7e3b0a02001-04-28 16:52:40 +0000713** just returns 0. This routine acquires a read-lock the first time it
714** has to go to disk, and could also playback an old journal if necessary.
715** Since _lookup() never goes to disk, it never has to deal with locks
716** or journal files.
drhed7c8552001-04-11 14:29:21 +0000717*/
drhd9b02572001-04-15 00:37:09 +0000718int sqlitepager_get(Pager *pPager, Pgno pgno, void **ppPage){
drhed7c8552001-04-11 14:29:21 +0000719 PgHdr *pPg;
720
drhd9b02572001-04-15 00:37:09 +0000721 /* Make sure we have not hit any critical errors.
722 */
723 if( pPager==0 || pgno==0 ){
724 return SQLITE_ERROR;
725 }
726 if( pPager->errMask & ~(PAGER_ERR_FULL) ){
727 return pager_errcode(pPager);
728 }
729
drhed7c8552001-04-11 14:29:21 +0000730 /* If this is the first page accessed, then get a read lock
731 ** on the database file.
732 */
733 if( pPager->nRef==0 ){
drha7fcb052001-12-14 15:09:55 +0000734 if( sqliteOsReadLock(&pPager->fd)!=SQLITE_OK ){
drhed7c8552001-04-11 14:29:21 +0000735 *ppPage = 0;
736 return SQLITE_BUSY;
737 }
drhd9b02572001-04-15 00:37:09 +0000738 pPager->state = SQLITE_READLOCK;
drhed7c8552001-04-11 14:29:21 +0000739
740 /* If a journal file exists, try to play it back.
741 */
drh8cfbf082001-09-19 13:22:39 +0000742 if( sqliteOsFileExists(pPager->zJournal) ){
drhf57b3392001-10-08 13:22:32 +0000743 int rc, dummy;
drhed7c8552001-04-11 14:29:21 +0000744
drha7fcb052001-12-14 15:09:55 +0000745 /* Get a write lock on the database
746 */
747 rc = sqliteOsWriteLock(&pPager->fd);
748 if( rc!=SQLITE_OK ){
drh6446c4d2001-12-15 14:22:18 +0000749 rc = sqliteOsUnlock(&pPager->fd);
drha7fcb052001-12-14 15:09:55 +0000750 assert( rc==SQLITE_OK );
751 *ppPage = 0;
752 return SQLITE_BUSY;
753 }
754 pPager->state = SQLITE_WRITELOCK;
755
drhed7c8552001-04-11 14:29:21 +0000756 /* Open the journal for exclusive access. Return SQLITE_BUSY if
drhf57b3392001-10-08 13:22:32 +0000757 ** we cannot get exclusive access to the journal file.
758 **
759 ** Even though we will only be reading from the journal, not writing,
760 ** we have to open the journal for writing in order to obtain an
761 ** exclusive access lock.
drhed7c8552001-04-11 14:29:21 +0000762 */
drhf57b3392001-10-08 13:22:32 +0000763 rc = sqliteOsOpenReadWrite(pPager->zJournal, &pPager->jfd, &dummy);
drha7fcb052001-12-14 15:09:55 +0000764 if( rc!=SQLITE_OK ){
765 rc = sqliteOsUnlock(&pPager->fd);
766 assert( rc==SQLITE_OK );
drhed7c8552001-04-11 14:29:21 +0000767 *ppPage = 0;
768 return SQLITE_BUSY;
769 }
drha7fcb052001-12-14 15:09:55 +0000770 pPager->journalOpen = 1;
drhed7c8552001-04-11 14:29:21 +0000771
772 /* Playback and delete the journal. Drop the database write
773 ** lock and reacquire the read lock.
774 */
drhd9b02572001-04-15 00:37:09 +0000775 rc = pager_playback(pPager);
776 if( rc!=SQLITE_OK ){
777 return rc;
778 }
drhed7c8552001-04-11 14:29:21 +0000779 }
780 pPg = 0;
781 }else{
782 /* Search for page in cache */
drhd9b02572001-04-15 00:37:09 +0000783 pPg = pager_lookup(pPager, pgno);
drhed7c8552001-04-11 14:29:21 +0000784 }
785 if( pPg==0 ){
drhd9b02572001-04-15 00:37:09 +0000786 /* The requested page is not in the page cache. */
drhed7c8552001-04-11 14:29:21 +0000787 int h;
drh7e3b0a02001-04-28 16:52:40 +0000788 pPager->nMiss++;
drhed7c8552001-04-11 14:29:21 +0000789 if( pPager->nPage<pPager->mxPage || pPager->pFirst==0 ){
790 /* Create a new page */
drh7e3b0a02001-04-28 16:52:40 +0000791 pPg = sqliteMalloc( sizeof(*pPg) + SQLITE_PAGE_SIZE + pPager->nExtra );
drhd9b02572001-04-15 00:37:09 +0000792 if( pPg==0 ){
793 *ppPage = 0;
794 pager_unwritelock(pPager);
795 pPager->errMask |= PAGER_ERR_MEM;
796 return SQLITE_NOMEM;
797 }
drhed7c8552001-04-11 14:29:21 +0000798 pPg->pPager = pPager;
drhd9b02572001-04-15 00:37:09 +0000799 pPg->pNextAll = pPager->pAll;
800 if( pPager->pAll ){
801 pPager->pAll->pPrevAll = pPg;
802 }
803 pPg->pPrevAll = 0;
drhd79caeb2001-04-15 02:27:24 +0000804 pPager->pAll = pPg;
drhd9b02572001-04-15 00:37:09 +0000805 pPager->nPage++;
drhed7c8552001-04-11 14:29:21 +0000806 }else{
drhd9b02572001-04-15 00:37:09 +0000807 /* Recycle an older page. First locate the page to be recycled.
808 ** Try to find one that is not dirty and is near the head of
809 ** of the free list */
drhed7c8552001-04-11 14:29:21 +0000810 pPg = pPager->pFirst;
drh603240c2002-03-05 01:11:12 +0000811 while( pPg && pPg->dirty ){
drhd9b02572001-04-15 00:37:09 +0000812 pPg = pPg->pNextFree;
813 }
drhb19a2bc2001-09-16 00:13:26 +0000814
815 /* If we could not find a page that has not been used recently
816 ** and which is not dirty, then sync the journal and write all
817 ** dirty free pages into the database file, thus making them
818 ** clean pages and available for recycling.
819 **
820 ** We have to sync the journal before writing a page to the main
821 ** database. But syncing is a very slow operation. So after a
822 ** sync, it is best to write everything we can back to the main
823 ** database to minimize the risk of having to sync again in the
824 ** near future. That is way we write all dirty pages after a
825 ** sync.
826 */
drh603240c2002-03-05 01:11:12 +0000827 if( pPg==0 ){
drh50e5dad2001-09-15 00:57:28 +0000828 int rc = syncAllPages(pPager);
829 if( rc!=0 ){
830 sqlitepager_rollback(pPager);
831 *ppPage = 0;
832 return SQLITE_IOERR;
833 }
834 pPg = pPager->pFirst;
835 }
drhd9b02572001-04-15 00:37:09 +0000836 assert( pPg->nRef==0 );
drh50e5dad2001-09-15 00:57:28 +0000837 assert( pPg->dirty==0 );
drhd9b02572001-04-15 00:37:09 +0000838
839 /* Unlink the old page from the free list and the hash table
840 */
drh6019e162001-07-02 17:51:45 +0000841 if( pPg->pPrevFree ){
842 pPg->pPrevFree->pNextFree = pPg->pNextFree;
drhed7c8552001-04-11 14:29:21 +0000843 }else{
drh6019e162001-07-02 17:51:45 +0000844 assert( pPager->pFirst==pPg );
845 pPager->pFirst = pPg->pNextFree;
drhed7c8552001-04-11 14:29:21 +0000846 }
drh6019e162001-07-02 17:51:45 +0000847 if( pPg->pNextFree ){
848 pPg->pNextFree->pPrevFree = pPg->pPrevFree;
849 }else{
850 assert( pPager->pLast==pPg );
851 pPager->pLast = pPg->pPrevFree;
852 }
853 pPg->pNextFree = pPg->pPrevFree = 0;
drhed7c8552001-04-11 14:29:21 +0000854 if( pPg->pNextHash ){
855 pPg->pNextHash->pPrevHash = pPg->pPrevHash;
856 }
857 if( pPg->pPrevHash ){
858 pPg->pPrevHash->pNextHash = pPg->pNextHash;
859 }else{
drhd9b02572001-04-15 00:37:09 +0000860 h = pager_hash(pPg->pgno);
drhed7c8552001-04-11 14:29:21 +0000861 assert( pPager->aHash[h]==pPg );
862 pPager->aHash[h] = pPg->pNextHash;
863 }
drh6019e162001-07-02 17:51:45 +0000864 pPg->pNextHash = pPg->pPrevHash = 0;
drhd9b02572001-04-15 00:37:09 +0000865 pPager->nOvfl++;
drhed7c8552001-04-11 14:29:21 +0000866 }
867 pPg->pgno = pgno;
drh1ab43002002-01-14 09:28:19 +0000868 if( pPager->aInJournal && (int)pgno<=pPager->origDbSize ){
drh6019e162001-07-02 17:51:45 +0000869 pPg->inJournal = (pPager->aInJournal[pgno/8] & (1<<(pgno&7)))!=0;
870 }else{
871 pPg->inJournal = 0;
872 }
drh663fc632002-02-02 18:49:19 +0000873 if( pPager->aInCkpt && (int)pgno<=pPager->ckptSize ){
drhfa86c412002-02-02 15:01:15 +0000874 pPg->inCkpt = (pPager->aInCkpt[pgno/8] & (1<<(pgno&7)))!=0;
875 }else{
876 pPg->inCkpt = 0;
877 }
drhed7c8552001-04-11 14:29:21 +0000878 pPg->dirty = 0;
879 pPg->nRef = 1;
drhdd793422001-06-28 01:54:48 +0000880 REFINFO(pPg);
drhd9b02572001-04-15 00:37:09 +0000881 pPager->nRef++;
882 h = pager_hash(pgno);
drhed7c8552001-04-11 14:29:21 +0000883 pPg->pNextHash = pPager->aHash[h];
884 pPager->aHash[h] = pPg;
885 if( pPg->pNextHash ){
886 assert( pPg->pNextHash->pPrevHash==0 );
887 pPg->pNextHash->pPrevHash = pPg;
888 }
drh306dc212001-05-21 13:45:10 +0000889 if( pPager->dbSize<0 ) sqlitepager_pagecount(pPager);
drh1ab43002002-01-14 09:28:19 +0000890 if( pPager->dbSize<(int)pgno ){
drh306dc212001-05-21 13:45:10 +0000891 memset(PGHDR_TO_DATA(pPg), 0, SQLITE_PAGE_SIZE);
892 }else{
drh81a20f22001-10-12 17:30:04 +0000893 int rc;
drha7fcb052001-12-14 15:09:55 +0000894 sqliteOsSeek(&pPager->fd, (pgno-1)*SQLITE_PAGE_SIZE);
895 rc = sqliteOsRead(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drh81a20f22001-10-12 17:30:04 +0000896 if( rc!=SQLITE_OK ){
897 return rc;
898 }
drh306dc212001-05-21 13:45:10 +0000899 }
drh7e3b0a02001-04-28 16:52:40 +0000900 if( pPager->nExtra>0 ){
901 memset(PGHDR_TO_EXTRA(pPg), 0, pPager->nExtra);
902 }
drhed7c8552001-04-11 14:29:21 +0000903 }else{
drhd9b02572001-04-15 00:37:09 +0000904 /* The requested page is in the page cache. */
drh7e3b0a02001-04-28 16:52:40 +0000905 pPager->nHit++;
drhdf0b3b02001-06-23 11:36:20 +0000906 page_ref(pPg);
drhed7c8552001-04-11 14:29:21 +0000907 }
908 *ppPage = PGHDR_TO_DATA(pPg);
909 return SQLITE_OK;
910}
911
912/*
drh7e3b0a02001-04-28 16:52:40 +0000913** Acquire a page if it is already in the in-memory cache. Do
914** not read the page from disk. Return a pointer to the page,
915** or 0 if the page is not in cache.
916**
917** See also sqlitepager_get(). The difference between this routine
918** and sqlitepager_get() is that _get() will go to the disk and read
919** in the page if the page is not already in cache. This routine
drh5e00f6c2001-09-13 13:46:56 +0000920** returns NULL if the page is not in cache or if a disk I/O error
921** has ever happened.
drh7e3b0a02001-04-28 16:52:40 +0000922*/
923void *sqlitepager_lookup(Pager *pPager, Pgno pgno){
924 PgHdr *pPg;
925
926 /* Make sure we have not hit any critical errors.
927 */
928 if( pPager==0 || pgno==0 ){
929 return 0;
930 }
931 if( pPager->errMask & ~(PAGER_ERR_FULL) ){
932 return 0;
933 }
934 if( pPager->nRef==0 ){
935 return 0;
936 }
937 pPg = pager_lookup(pPager, pgno);
938 if( pPg==0 ) return 0;
drhdf0b3b02001-06-23 11:36:20 +0000939 page_ref(pPg);
drh7e3b0a02001-04-28 16:52:40 +0000940 return PGHDR_TO_DATA(pPg);
941}
942
943/*
drhed7c8552001-04-11 14:29:21 +0000944** Release a page.
945**
946** If the number of references to the page drop to zero, then the
947** page is added to the LRU list. When all references to all pages
drhd9b02572001-04-15 00:37:09 +0000948** are released, a rollback occurs and the lock on the database is
drhed7c8552001-04-11 14:29:21 +0000949** removed.
950*/
drhd9b02572001-04-15 00:37:09 +0000951int sqlitepager_unref(void *pData){
drhed7c8552001-04-11 14:29:21 +0000952 PgHdr *pPg;
drhd9b02572001-04-15 00:37:09 +0000953
954 /* Decrement the reference count for this page
955 */
drhed7c8552001-04-11 14:29:21 +0000956 pPg = DATA_TO_PGHDR(pData);
957 assert( pPg->nRef>0 );
drhed7c8552001-04-11 14:29:21 +0000958 pPg->nRef--;
drhdd793422001-06-28 01:54:48 +0000959 REFINFO(pPg);
drhd9b02572001-04-15 00:37:09 +0000960
drh72f82862001-05-24 21:06:34 +0000961 /* When the number of references to a page reach 0, call the
962 ** destructor and add the page to the freelist.
drhd9b02572001-04-15 00:37:09 +0000963 */
drhed7c8552001-04-11 14:29:21 +0000964 if( pPg->nRef==0 ){
drh1eaa2692001-09-18 02:02:23 +0000965 Pager *pPager;
966 pPager = pPg->pPager;
drhd9b02572001-04-15 00:37:09 +0000967 pPg->pNextFree = 0;
968 pPg->pPrevFree = pPager->pLast;
drhed7c8552001-04-11 14:29:21 +0000969 pPager->pLast = pPg;
drhd9b02572001-04-15 00:37:09 +0000970 if( pPg->pPrevFree ){
971 pPg->pPrevFree->pNextFree = pPg;
drhed7c8552001-04-11 14:29:21 +0000972 }else{
973 pPager->pFirst = pPg;
974 }
drh72f82862001-05-24 21:06:34 +0000975 if( pPager->xDestructor ){
976 pPager->xDestructor(pData);
977 }
drhd9b02572001-04-15 00:37:09 +0000978
979 /* When all pages reach the freelist, drop the read lock from
980 ** the database file.
981 */
982 pPager->nRef--;
983 assert( pPager->nRef>=0 );
984 if( pPager->nRef==0 ){
985 pager_reset(pPager);
986 }
drhed7c8552001-04-11 14:29:21 +0000987 }
drhd9b02572001-04-15 00:37:09 +0000988 return SQLITE_OK;
drhed7c8552001-04-11 14:29:21 +0000989}
990
991/*
992** Mark a data page as writeable. The page is written into the journal
993** if it is not there already. This routine must be called before making
994** changes to a page.
995**
996** The first time this routine is called, the pager creates a new
997** journal and acquires a write lock on the database. If the write
998** lock could not be acquired, this routine returns SQLITE_BUSY. The
drh306dc212001-05-21 13:45:10 +0000999** calling routine must check for that return value and be careful not to
drhed7c8552001-04-11 14:29:21 +00001000** change any page data until this routine returns SQLITE_OK.
drhd9b02572001-04-15 00:37:09 +00001001**
1002** If the journal file could not be written because the disk is full,
1003** then this routine returns SQLITE_FULL and does an immediate rollback.
1004** All subsequent write attempts also return SQLITE_FULL until there
1005** is a call to sqlitepager_commit() or sqlitepager_rollback() to
1006** reset.
drhed7c8552001-04-11 14:29:21 +00001007*/
drhd9b02572001-04-15 00:37:09 +00001008int sqlitepager_write(void *pData){
drh69688d52001-04-14 16:38:23 +00001009 PgHdr *pPg = DATA_TO_PGHDR(pData);
1010 Pager *pPager = pPg->pPager;
drhd79caeb2001-04-15 02:27:24 +00001011 int rc = SQLITE_OK;
drh69688d52001-04-14 16:38:23 +00001012
drh6446c4d2001-12-15 14:22:18 +00001013 /* Check for errors
1014 */
drhd9b02572001-04-15 00:37:09 +00001015 if( pPager->errMask ){
1016 return pager_errcode(pPager);
1017 }
drh5e00f6c2001-09-13 13:46:56 +00001018 if( pPager->readOnly ){
1019 return SQLITE_PERM;
1020 }
drh6446c4d2001-12-15 14:22:18 +00001021
1022 /* Mark the page as dirty. If the page has already been written
1023 ** to the journal then we can return right away.
1024 */
drhd9b02572001-04-15 00:37:09 +00001025 pPg->dirty = 1;
drhfa86c412002-02-02 15:01:15 +00001026 if( pPg->inJournal && (pPg->inCkpt || pPager->ckptOpen==0) ){
1027 return SQLITE_OK;
1028 }
drh6446c4d2001-12-15 14:22:18 +00001029
1030 /* If we get this far, it means that the page needs to be
drhfa86c412002-02-02 15:01:15 +00001031 ** written to the transaction journal or the ckeckpoint journal
1032 ** or both.
1033 **
1034 ** First check to see that the transaction journal exists and
1035 ** create it if it does not.
drh6446c4d2001-12-15 14:22:18 +00001036 */
drhd9b02572001-04-15 00:37:09 +00001037 assert( pPager->state!=SQLITE_UNLOCK );
drhed7c8552001-04-11 14:29:21 +00001038 if( pPager->state==SQLITE_READLOCK ){
drh6019e162001-07-02 17:51:45 +00001039 assert( pPager->aInJournal==0 );
drha7fcb052001-12-14 15:09:55 +00001040 rc = sqliteOsWriteLock(&pPager->fd);
1041 if( rc!=SQLITE_OK ){
1042 return rc;
1043 }
drh6019e162001-07-02 17:51:45 +00001044 pPager->aInJournal = sqliteMalloc( pPager->dbSize/8 + 1 );
1045 if( pPager->aInJournal==0 ){
drha7fcb052001-12-14 15:09:55 +00001046 sqliteOsReadLock(&pPager->fd);
drh6019e162001-07-02 17:51:45 +00001047 return SQLITE_NOMEM;
1048 }
drhfa86c412002-02-02 15:01:15 +00001049 rc = sqliteOsOpenExclusive(pPager->zJournal, &pPager->jfd, 0);
drh8cfbf082001-09-19 13:22:39 +00001050 if( rc!=SQLITE_OK ){
drh6d4abfb2001-10-22 02:58:08 +00001051 sqliteFree(pPager->aInJournal);
drha7fcb052001-12-14 15:09:55 +00001052 pPager->aInJournal = 0;
1053 sqliteOsReadLock(&pPager->fd);
drhed7c8552001-04-11 14:29:21 +00001054 return SQLITE_CANTOPEN;
1055 }
drh8cfbf082001-09-19 13:22:39 +00001056 pPager->journalOpen = 1;
drhf57b14a2001-09-14 18:54:08 +00001057 pPager->needSync = 0;
drhed7c8552001-04-11 14:29:21 +00001058 pPager->state = SQLITE_WRITELOCK;
drhd9b02572001-04-15 00:37:09 +00001059 sqlitepager_pagecount(pPager);
drh69688d52001-04-14 16:38:23 +00001060 pPager->origDbSize = pPager->dbSize;
drha7fcb052001-12-14 15:09:55 +00001061 rc = sqliteOsWrite(&pPager->jfd, aJournalMagic, sizeof(aJournalMagic));
drhd9b02572001-04-15 00:37:09 +00001062 if( rc==SQLITE_OK ){
drha7fcb052001-12-14 15:09:55 +00001063 rc = sqliteOsWrite(&pPager->jfd, &pPager->dbSize, sizeof(Pgno));
drhd9b02572001-04-15 00:37:09 +00001064 }
1065 if( rc!=SQLITE_OK ){
1066 rc = pager_unwritelock(pPager);
1067 if( rc==SQLITE_OK ) rc = SQLITE_FULL;
1068 return rc;
1069 }
drhed7c8552001-04-11 14:29:21 +00001070 }
drhd9b02572001-04-15 00:37:09 +00001071 assert( pPager->state==SQLITE_WRITELOCK );
drh8cfbf082001-09-19 13:22:39 +00001072 assert( pPager->journalOpen );
drh6446c4d2001-12-15 14:22:18 +00001073
drhfa86c412002-02-02 15:01:15 +00001074 /* The transaction journal now exists and we have a write lock on the
1075 ** main database file. Write the current page to the transaction
1076 ** journal if it is not there already.
drh6446c4d2001-12-15 14:22:18 +00001077 */
drhfa86c412002-02-02 15:01:15 +00001078 if( !pPg->inJournal && (int)pPg->pgno <= pPager->origDbSize ){
drha7fcb052001-12-14 15:09:55 +00001079 rc = sqliteOsWrite(&pPager->jfd, &pPg->pgno, sizeof(Pgno));
drhd9b02572001-04-15 00:37:09 +00001080 if( rc==SQLITE_OK ){
drha7fcb052001-12-14 15:09:55 +00001081 rc = sqliteOsWrite(&pPager->jfd, pData, SQLITE_PAGE_SIZE);
drhd9b02572001-04-15 00:37:09 +00001082 }
1083 if( rc!=SQLITE_OK ){
1084 sqlitepager_rollback(pPager);
1085 pPager->errMask |= PAGER_ERR_FULL;
1086 return rc;
1087 }
drh6019e162001-07-02 17:51:45 +00001088 assert( pPager->aInJournal!=0 );
1089 pPager->aInJournal[pPg->pgno/8] |= 1<<(pPg->pgno&7);
drh603240c2002-03-05 01:11:12 +00001090 pPager->needSync = !pPager->noSync;
drhfa86c412002-02-02 15:01:15 +00001091 pPg->inJournal = 1;
1092 if( pPager->ckptOpen ){
1093 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1094 pPg->inCkpt = 1;
1095 }
drh69688d52001-04-14 16:38:23 +00001096 }
drh6446c4d2001-12-15 14:22:18 +00001097
drhfa86c412002-02-02 15:01:15 +00001098 /* If the checkpoint journal is open and the page is not in it,
1099 ** then write the current page to the checkpoint journal.
drh6446c4d2001-12-15 14:22:18 +00001100 */
drh663fc632002-02-02 18:49:19 +00001101 if( pPager->ckptOpen && !pPg->inCkpt && (int)pPg->pgno<=pPager->ckptSize ){
drh1e336b42002-02-14 12:50:33 +00001102 assert( pPg->inJournal || (int)pPg->pgno>pPager->origDbSize );
drhfa86c412002-02-02 15:01:15 +00001103 rc = sqliteOsWrite(&pPager->cpfd, &pPg->pgno, sizeof(Pgno));
1104 if( rc==SQLITE_OK ){
1105 rc = sqliteOsWrite(&pPager->cpfd, pData, SQLITE_PAGE_SIZE);
1106 }
1107 if( rc!=SQLITE_OK ){
1108 sqlitepager_rollback(pPager);
1109 pPager->errMask |= PAGER_ERR_FULL;
1110 return rc;
1111 }
1112 assert( pPager->aInCkpt!=0 );
1113 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1114 pPg->inCkpt = 1;
1115 }
1116
1117 /* Update the database size and return.
1118 */
drh1ab43002002-01-14 09:28:19 +00001119 if( pPager->dbSize<(int)pPg->pgno ){
drh306dc212001-05-21 13:45:10 +00001120 pPager->dbSize = pPg->pgno;
1121 }
drh69688d52001-04-14 16:38:23 +00001122 return rc;
drhed7c8552001-04-11 14:29:21 +00001123}
1124
1125/*
drhaacc5432002-01-06 17:07:40 +00001126** Return TRUE if the page given in the argument was previously passed
drh6019e162001-07-02 17:51:45 +00001127** to sqlitepager_write(). In other words, return TRUE if it is ok
1128** to change the content of the page.
1129*/
1130int sqlitepager_iswriteable(void *pData){
1131 PgHdr *pPg = DATA_TO_PGHDR(pData);
1132 return pPg->dirty;
1133}
1134
1135/*
drh30e58752002-03-02 20:41:57 +00001136** A call to this routine tells the pager that it is not necessary to
1137** write the information on page "pgno" back to the disk, even though
1138** that page might be marked as dirty.
1139**
1140** The overlying software layer calls this routine when all of the data
1141** on the given page is unused. The pager marks the page as clean so
1142** that it does not get written to disk.
1143**
1144** Tests show that this optimization, together with the
1145** sqlitepager_dont_rollback() below, more than double the speed
1146** of large INSERT operations and quadruple the speed of large DELETEs.
1147*/
1148void sqlitepager_dont_write(Pager *pPager, Pgno pgno){
1149 PgHdr *pPg;
1150 pPg = pager_lookup(pPager, pgno);
1151 if( pPg && pPg->dirty ){
1152 pPg->dirty = 0;
1153 }
1154}
1155
1156/*
1157** A call to this routine tells the pager that if a rollback occurs,
1158** it is not necessary to restore the data on the given page. This
1159** means that the pager does not have to record the given page in the
1160** rollback journal.
1161*/
1162void sqlitepager_dont_rollback(void *pData){
1163 PgHdr *pPg = DATA_TO_PGHDR(pData);
1164 Pager *pPager = pPg->pPager;
1165
1166 if( pPager->state!=SQLITE_WRITELOCK || pPager->journalOpen==0 ) return;
1167 if( !pPg->inJournal && (int)pPg->pgno <= pPager->origDbSize ){
1168 assert( pPager->aInJournal!=0 );
1169 pPager->aInJournal[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1170 pPg->inJournal = 1;
1171 if( pPager->ckptOpen ){
1172 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1173 pPg->inCkpt = 1;
1174 }
1175 }
1176 if( pPager->ckptOpen && !pPg->inCkpt && (int)pPg->pgno<=pPager->ckptSize ){
1177 assert( pPg->inJournal || (int)pPg->pgno>pPager->origDbSize );
1178 assert( pPager->aInCkpt!=0 );
1179 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1180 pPg->inCkpt = 1;
1181 }
1182}
1183
1184/*
drhed7c8552001-04-11 14:29:21 +00001185** Commit all changes to the database and release the write lock.
drhd9b02572001-04-15 00:37:09 +00001186**
1187** If the commit fails for any reason, a rollback attempt is made
1188** and an error code is returned. If the commit worked, SQLITE_OK
1189** is returned.
drhed7c8552001-04-11 14:29:21 +00001190*/
drhd9b02572001-04-15 00:37:09 +00001191int sqlitepager_commit(Pager *pPager){
drha1b351a2001-09-14 16:42:12 +00001192 int rc;
drhed7c8552001-04-11 14:29:21 +00001193 PgHdr *pPg;
drhd9b02572001-04-15 00:37:09 +00001194
1195 if( pPager->errMask==PAGER_ERR_FULL ){
1196 rc = sqlitepager_rollback(pPager);
1197 if( rc==SQLITE_OK ) rc = SQLITE_FULL;
1198 return rc;
1199 }
1200 if( pPager->errMask!=0 ){
1201 rc = pager_errcode(pPager);
1202 return rc;
1203 }
1204 if( pPager->state!=SQLITE_WRITELOCK ){
1205 return SQLITE_ERROR;
1206 }
drh8cfbf082001-09-19 13:22:39 +00001207 assert( pPager->journalOpen );
drha7fcb052001-12-14 15:09:55 +00001208 if( pPager->needSync && sqliteOsSync(&pPager->jfd)!=SQLITE_OK ){
drhd9b02572001-04-15 00:37:09 +00001209 goto commit_abort;
drhed7c8552001-04-11 14:29:21 +00001210 }
drha1b351a2001-09-14 16:42:12 +00001211 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
1212 if( pPg->dirty==0 ) continue;
drha7fcb052001-12-14 15:09:55 +00001213 rc = sqliteOsSeek(&pPager->fd, (pPg->pgno-1)*SQLITE_PAGE_SIZE);
drha1b351a2001-09-14 16:42:12 +00001214 if( rc!=SQLITE_OK ) goto commit_abort;
drha7fcb052001-12-14 15:09:55 +00001215 rc = sqliteOsWrite(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drha1b351a2001-09-14 16:42:12 +00001216 if( rc!=SQLITE_OK ) goto commit_abort;
drhed7c8552001-04-11 14:29:21 +00001217 }
drh603240c2002-03-05 01:11:12 +00001218 if( !pPager->noSync && sqliteOsSync(&pPager->fd)!=SQLITE_OK ){
1219 goto commit_abort;
1220 }
drhd9b02572001-04-15 00:37:09 +00001221 rc = pager_unwritelock(pPager);
1222 pPager->dbSize = -1;
1223 return rc;
1224
1225 /* Jump here if anything goes wrong during the commit process.
1226 */
1227commit_abort:
1228 rc = sqlitepager_rollback(pPager);
1229 if( rc==SQLITE_OK ){
1230 rc = SQLITE_FULL;
drhed7c8552001-04-11 14:29:21 +00001231 }
drhed7c8552001-04-11 14:29:21 +00001232 return rc;
1233}
1234
1235/*
1236** Rollback all changes. The database falls back to read-only mode.
1237** All in-memory cache pages revert to their original data contents.
1238** The journal is deleted.
drhd9b02572001-04-15 00:37:09 +00001239**
1240** This routine cannot fail unless some other process is not following
1241** the correct locking protocol (SQLITE_PROTOCOL) or unless some other
1242** process is writing trash into the journal file (SQLITE_CORRUPT) or
1243** unless a prior malloc() failed (SQLITE_NOMEM). Appropriate error
1244** codes are returned for all these occasions. Otherwise,
1245** SQLITE_OK is returned.
drhed7c8552001-04-11 14:29:21 +00001246*/
drhd9b02572001-04-15 00:37:09 +00001247int sqlitepager_rollback(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +00001248 int rc;
drhd9b02572001-04-15 00:37:09 +00001249 if( pPager->errMask!=0 && pPager->errMask!=PAGER_ERR_FULL ){
1250 return pager_errcode(pPager);
drhed7c8552001-04-11 14:29:21 +00001251 }
drhd9b02572001-04-15 00:37:09 +00001252 if( pPager->state!=SQLITE_WRITELOCK ){
1253 return SQLITE_OK;
1254 }
1255 rc = pager_playback(pPager);
1256 if( rc!=SQLITE_OK ){
1257 rc = SQLITE_CORRUPT;
1258 pPager->errMask |= PAGER_ERR_CORRUPT;
1259 }
1260 pPager->dbSize = -1;
drhed7c8552001-04-11 14:29:21 +00001261 return rc;
drh98808ba2001-10-18 12:34:46 +00001262}
drhd9b02572001-04-15 00:37:09 +00001263
1264/*
drh5e00f6c2001-09-13 13:46:56 +00001265** Return TRUE if the database file is opened read-only. Return FALSE
1266** if the database is (in theory) writable.
1267*/
1268int sqlitepager_isreadonly(Pager *pPager){
drhbe0072d2001-09-13 14:46:09 +00001269 return pPager->readOnly;
drh5e00f6c2001-09-13 13:46:56 +00001270}
1271
1272/*
drhd9b02572001-04-15 00:37:09 +00001273** This routine is used for testing and analysis only.
1274*/
1275int *sqlitepager_stats(Pager *pPager){
1276 static int a[9];
1277 a[0] = pPager->nRef;
1278 a[1] = pPager->nPage;
1279 a[2] = pPager->mxPage;
1280 a[3] = pPager->dbSize;
1281 a[4] = pPager->state;
1282 a[5] = pPager->errMask;
1283 a[6] = pPager->nHit;
1284 a[7] = pPager->nMiss;
1285 a[8] = pPager->nOvfl;
1286 return a;
1287}
drhdd793422001-06-28 01:54:48 +00001288
drhfa86c412002-02-02 15:01:15 +00001289/*
1290** Set the checkpoint.
1291**
1292** This routine should be called with the transaction journal already
1293** open. A new checkpoint journal is created that can be used to rollback
drhaaab5722002-02-19 13:39:21 +00001294** changes of a single SQL command within a larger transaction.
drhfa86c412002-02-02 15:01:15 +00001295*/
1296int sqlitepager_ckpt_begin(Pager *pPager){
1297 int rc;
1298 char zTemp[SQLITE_TEMPNAME_SIZE];
1299 assert( pPager->journalOpen );
1300 assert( !pPager->ckptOpen );
1301 pPager->aInCkpt = sqliteMalloc( pPager->dbSize/8 + 1 );
1302 if( pPager->aInCkpt==0 ){
1303 sqliteOsReadLock(&pPager->fd);
1304 return SQLITE_NOMEM;
1305 }
1306 rc = sqliteOsFileSize(&pPager->jfd, &pPager->ckptJSize);
1307 if( rc ) goto ckpt_begin_failed;
drh663fc632002-02-02 18:49:19 +00001308 pPager->ckptSize = pPager->dbSize;
drhfa86c412002-02-02 15:01:15 +00001309 rc = sqlitepager_opentemp(zTemp, &pPager->cpfd);
1310 if( rc ) goto ckpt_begin_failed;
1311 pPager->ckptOpen = 1;
1312 return SQLITE_OK;
1313
1314ckpt_begin_failed:
1315 if( pPager->aInCkpt ){
1316 sqliteFree(pPager->aInCkpt);
1317 pPager->aInCkpt = 0;
1318 }
1319 return rc;
1320}
1321
1322/*
1323** Commit a checkpoint.
1324*/
1325int sqlitepager_ckpt_commit(Pager *pPager){
drh663fc632002-02-02 18:49:19 +00001326 if( pPager->ckptOpen ){
1327 PgHdr *pPg;
1328 sqliteOsClose(&pPager->cpfd);
1329 pPager->ckptOpen = 0;
1330 sqliteFree( pPager->aInCkpt );
1331 pPager->aInCkpt = 0;
1332 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
1333 pPg->inCkpt = 0;
1334 }
1335 }
drhfa86c412002-02-02 15:01:15 +00001336 return SQLITE_OK;
1337}
1338
1339/*
1340** Rollback a checkpoint.
1341*/
1342int sqlitepager_ckpt_rollback(Pager *pPager){
1343 int rc;
drh663fc632002-02-02 18:49:19 +00001344 if( pPager->ckptOpen ){
1345 rc = pager_ckpt_playback(pPager);
1346 sqlitepager_ckpt_commit(pPager);
1347 }else{
1348 rc = SQLITE_OK;
1349 }
drhfa86c412002-02-02 15:01:15 +00001350 return rc;
1351}
1352
#if SQLITE_TEST
/*
** Print one line for every page that currently has a positive
** reference count, showing its page number, the address of its data
** and the reference count.
*/
void sqlitepager_refdump(Pager *pPager){
  PgHdr *pPg = pPager->pAll;
  while( pPg ){
    if( pPg->nRef>0 ){
      printf("PAGE %3d addr=0x%08x nRef=%d\n",
         pPg->pgno, (int)PGHDR_TO_DATA(pPg), pPg->nRef);
    }
    pPg = pPg->pNextAll;
  }
}
#endif