blob: 1f0fb3aed88b9a3a942cc17ee5fc6922994ebd14 [file] [log] [blame]
/*
** 2001 September 15
**
** The author disclaims copyright to this source code.  In place of
** a legal notice, here is a blessing:
**
**    May you do good and not evil.
**    May you find forgiveness for yourself and forgive others.
**    May you share freely, never taking more than you give.
**
*************************************************************************
** This is the implementation of the page cache subsystem or "pager".
**
** The pager is used to access a database disk file.  It implements
** atomic commit and rollback through the use of a journal file that
** is separate from the database file.  The pager also implements file
** locking to prevent two processes from writing the same database
** file simultaneously, or one process from reading the database while
** another is writing.
**
** @(#) $Id: pager.c,v 1.43 2002/03/05 12:41:20 drh Exp $
*/
drhd9b02572001-04-15 00:37:09 +000023#include "sqliteInt.h"
drhed7c8552001-04-11 14:29:21 +000024#include "pager.h"
drh8cfbf082001-09-19 13:22:39 +000025#include "os.h"
drhed7c8552001-04-11 14:29:21 +000026#include <assert.h>
drhd9b02572001-04-15 00:37:09 +000027#include <string.h>
drhed7c8552001-04-11 14:29:21 +000028
/*
** Lock states of the page cache.  At any moment the cache as a whole
** is in exactly one of the following states:
**
**   SQLITE_UNLOCK       Nothing is being read from or written to the
**                       database file and no page data is held in
**                       memory.  This is the initial state.
**
**   SQLITE_READLOCK     The database is being read.  Writing is not
**                       permitted.  Several readers may access the
**                       same database file at the same time.
**
**   SQLITE_WRITELOCK    The database is being written.  Access is
**                       exclusive: no other process or thread can be
**                       reading or writing while one process writes.
**
** State transitions:
**
**   * The cache comes up in SQLITE_UNLOCK.
**   * The first page fetch moves it to SQLITE_READLOCK.
**   * Releasing the last outstanding page moves it back to
**     SQLITE_UNLOCK.
**   * The first request to write a page moves it to SQLITE_WRITELOCK.
**     Only an outstanding page can be written, so the cache is always
**     in SQLITE_READLOCK just before this transition.
**   * Rollback and commit move it from SQLITE_WRITELOCK back to
**     SQLITE_READLOCK.
**
** The numeric values are ordered; code in this file tests for a write
** lock with "state>=SQLITE_WRITELOCK".
*/
#define SQLITE_UNLOCK      0
#define SQLITE_READLOCK    1
#define SQLITE_WRITELOCK   2
62
drhd9b02572001-04-15 00:37:09 +000063
drhed7c8552001-04-11 14:29:21 +000064/*
65** Each in-memory image of a page begins with the following header.
drhbd03cae2001-06-02 02:40:57 +000066** This header is only visible to this pager module. The client
67** code that calls pager sees only the data that follows the header.
drhed7c8552001-04-11 14:29:21 +000068*/
drhd9b02572001-04-15 00:37:09 +000069typedef struct PgHdr PgHdr;
drhed7c8552001-04-11 14:29:21 +000070struct PgHdr {
71 Pager *pPager; /* The pager to which this page belongs */
72 Pgno pgno; /* The page number for this page */
drh69688d52001-04-14 16:38:23 +000073 PgHdr *pNextHash, *pPrevHash; /* Hash collision chain for PgHdr.pgno */
drhed7c8552001-04-11 14:29:21 +000074 int nRef; /* Number of users of this page */
drhd9b02572001-04-15 00:37:09 +000075 PgHdr *pNextFree, *pPrevFree; /* Freelist of pages where nRef==0 */
76 PgHdr *pNextAll, *pPrevAll; /* A list of all pages */
drhed7c8552001-04-11 14:29:21 +000077 char inJournal; /* TRUE if has been written to journal */
drhfa86c412002-02-02 15:01:15 +000078 char inCkpt; /* TRUE if written to the checkpoint journal */
drhed7c8552001-04-11 14:29:21 +000079 char dirty; /* TRUE if we need to write back changes */
drh69688d52001-04-14 16:38:23 +000080 /* SQLITE_PAGE_SIZE bytes of page data follow this header */
drh7e3b0a02001-04-28 16:52:40 +000081 /* Pager.nExtra bytes of local data follow the page data */
drhed7c8552001-04-11 14:29:21 +000082};
83
/*
** Pointer conversions between a page header and the regions that
** follow it:
**
**   PGHDR_TO_DATA(P)    PgHdr pointer -> the page data immediately
**                       after the header
**   DATA_TO_PGHDR(D)    page data pointer -> the PgHdr immediately
**                       before it
**   PGHDR_TO_EXTRA(P)   PgHdr pointer -> the bytes located
**                       SQLITE_PAGE_SIZE past the start of the page data
*/
#define PGHDR_TO_DATA(P)   ((void*)((P)+1))
#define DATA_TO_PGHDR(D)   (((PgHdr*)(D))-1)
#define PGHDR_TO_EXTRA(P)  ((void*)(((char*)((P)+1))+SQLITE_PAGE_SIZE))
drhed7c8552001-04-11 14:29:21 +000091
/*
** Number of buckets in the hash table that locates in-memory pages
** by page number.  Knuth says this should be a prime number.
*/
#define N_PG_HASH   2003
drhed7c8552001-04-11 14:29:21 +000097
98/*
99** A open page cache is an instance of the following structure.
100*/
101struct Pager {
102 char *zFilename; /* Name of the database file */
103 char *zJournal; /* Name of the journal file */
drh8cfbf082001-09-19 13:22:39 +0000104 OsFile fd, jfd; /* File descriptors for database and journal */
drhfa86c412002-02-02 15:01:15 +0000105 OsFile cpfd; /* File descriptor for the checkpoint journal */
drhed7c8552001-04-11 14:29:21 +0000106 int dbSize; /* Number of pages in the file */
drh69688d52001-04-14 16:38:23 +0000107 int origDbSize; /* dbSize before the current change */
drhfa86c412002-02-02 15:01:15 +0000108 int ckptSize, ckptJSize; /* Size of database and journal at ckpt_begin() */
drh7e3b0a02001-04-28 16:52:40 +0000109 int nExtra; /* Add this many bytes to each in-memory page */
drh72f82862001-05-24 21:06:34 +0000110 void (*xDestructor)(void*); /* Call this routine when freeing pages */
drhed7c8552001-04-11 14:29:21 +0000111 int nPage; /* Total number of in-memory pages */
drhd9b02572001-04-15 00:37:09 +0000112 int nRef; /* Number of in-memory pages with PgHdr.nRef>0 */
drhed7c8552001-04-11 14:29:21 +0000113 int mxPage; /* Maximum number of pages to hold in cache */
drhd9b02572001-04-15 00:37:09 +0000114 int nHit, nMiss, nOvfl; /* Cache hits, missing, and LRU overflows */
drh603240c2002-03-05 01:11:12 +0000115 u8 journalOpen; /* True if journal file descriptors is valid */
116 u8 ckptOpen; /* True if the checkpoint journal is open */
117 u8 noSync; /* Do not sync the journal if true */
118 u8 state; /* SQLITE_UNLOCK, _READLOCK or _WRITELOCK */
119 u8 errMask; /* One of several kinds of errors */
120 u8 tempFile; /* zFilename is a temporary file */
121 u8 readOnly; /* True for a read-only database */
122 u8 needSync; /* True if an fsync() is needed on the journal */
123 u8 *aInJournal; /* One bit for each page in the database file */
124 u8 *aInCkpt; /* One bit for each page in the database */
drhed7c8552001-04-11 14:29:21 +0000125 PgHdr *pFirst, *pLast; /* List of free pages */
drhd9b02572001-04-15 00:37:09 +0000126 PgHdr *pAll; /* List of all pages */
drhed7c8552001-04-11 14:29:21 +0000127 PgHdr *aHash[N_PG_HASH]; /* Hash table to map page number of PgHdr */
drhd9b02572001-04-15 00:37:09 +0000128};
129
/*
** Bit flags that may be set in Pager.errMask.  More than one bit can
** be set at once; pager_errcode() picks the result code to report.
*/
#define PAGER_ERR_FULL     0x01   /* a write() failed */
#define PAGER_ERR_MEM      0x02   /* malloc() failed */
#define PAGER_ERR_LOCK     0x04   /* error in the locking protocol */
#define PAGER_ERR_CORRUPT  0x08   /* database or journal corruption */
#define PAGER_ERR_DISK     0x10   /* general disk I/O error - bad hard drive? */
drhd9b02572001-04-15 00:37:09 +0000138
139/*
140** The journal file contains page records in the following
141** format.
142*/
143typedef struct PageRecord PageRecord;
144struct PageRecord {
145 Pgno pgno; /* The page number */
146 char aData[SQLITE_PAGE_SIZE]; /* Original data for page pgno */
147};
148
/*
** Magic string found at the start of every journal file.  The bytes
** were obtained from /dev/random and serve only as a sanity check.
*/
static const unsigned char aJournalMagic[] = {
  0xd9, 0xd5, 0x05, 0xf9,
  0x20, 0xa1, 0x63, 0xd4,
};
156
/*
** Map a page number onto a bucket index in the range 0..N_PG_HASH-1.
*/
#define pager_hash(PN)   ((PN) % N_PG_HASH)
drhed7c8552001-04-11 14:29:21 +0000161
/*
** Reference count tracking for debugging.
**
** When compiled with SQLITE_TEST, REFINFO(X) calls pager_refinfo(),
** which prints the page number, the address of the page data and the
** current reference count of page X whenever the global
** pager_refinfo_enable is non-zero.  Without SQLITE_TEST, REFINFO(X)
** expands to nothing.
**
** The address is printed with %p.  Casting the pointer to int would
** truncate it on platforms where pointers are wider than int.  The
** page number is cast to int so that it matches the %d conversion.
*/
#if SQLITE_TEST
  int pager_refinfo_enable = 0;
  static void pager_refinfo(PgHdr *p){
    static int cnt = 0;
    if( !pager_refinfo_enable ) return;
    printf(
       "REFCNT: %4d addr=%p nRef=%d\n",
       (int)p->pgno, PGHDR_TO_DATA(p), p->nRef
    );
    cnt++;   /* Something to set a breakpoint on */
  }
# define REFINFO(X)  pager_refinfo(X)
#else
# define REFINFO(X)
#endif
180
181/*
drhd9b02572001-04-15 00:37:09 +0000182** Convert the bits in the pPager->errMask into an approprate
183** return code.
184*/
185static int pager_errcode(Pager *pPager){
186 int rc = SQLITE_OK;
187 if( pPager->errMask & PAGER_ERR_LOCK ) rc = SQLITE_PROTOCOL;
drh81a20f22001-10-12 17:30:04 +0000188 if( pPager->errMask & PAGER_ERR_DISK ) rc = SQLITE_IOERR;
drhd9b02572001-04-15 00:37:09 +0000189 if( pPager->errMask & PAGER_ERR_FULL ) rc = SQLITE_FULL;
190 if( pPager->errMask & PAGER_ERR_MEM ) rc = SQLITE_NOMEM;
191 if( pPager->errMask & PAGER_ERR_CORRUPT ) rc = SQLITE_CORRUPT;
192 return rc;
drhed7c8552001-04-11 14:29:21 +0000193}
194
195/*
196** Find a page in the hash table given its page number. Return
197** a pointer to the page or NULL if not found.
198*/
drhd9b02572001-04-15 00:37:09 +0000199static PgHdr *pager_lookup(Pager *pPager, Pgno pgno){
drhed7c8552001-04-11 14:29:21 +0000200 PgHdr *p = pPager->aHash[pgno % N_PG_HASH];
201 while( p && p->pgno!=pgno ){
202 p = p->pNextHash;
203 }
204 return p;
205}
206
207/*
208** Unlock the database and clear the in-memory cache. This routine
209** sets the state of the pager back to what it was when it was first
210** opened. Any outstanding pages are invalidated and subsequent attempts
211** to access those pages will likely result in a coredump.
212*/
drhd9b02572001-04-15 00:37:09 +0000213static void pager_reset(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000214 PgHdr *pPg, *pNext;
drhd9b02572001-04-15 00:37:09 +0000215 for(pPg=pPager->pAll; pPg; pPg=pNext){
216 pNext = pPg->pNextAll;
217 sqliteFree(pPg);
drhed7c8552001-04-11 14:29:21 +0000218 }
219 pPager->pFirst = 0;
drhd9b02572001-04-15 00:37:09 +0000220 pPager->pLast = 0;
221 pPager->pAll = 0;
drhed7c8552001-04-11 14:29:21 +0000222 memset(pPager->aHash, 0, sizeof(pPager->aHash));
223 pPager->nPage = 0;
drhfa86c412002-02-02 15:01:15 +0000224 if( pPager->state>=SQLITE_WRITELOCK ){
drhd9b02572001-04-15 00:37:09 +0000225 sqlitepager_rollback(pPager);
drhed7c8552001-04-11 14:29:21 +0000226 }
drha7fcb052001-12-14 15:09:55 +0000227 sqliteOsUnlock(&pPager->fd);
drhed7c8552001-04-11 14:29:21 +0000228 pPager->state = SQLITE_UNLOCK;
drhd9b02572001-04-15 00:37:09 +0000229 pPager->dbSize = -1;
drhed7c8552001-04-11 14:29:21 +0000230 pPager->nRef = 0;
drh8cfbf082001-09-19 13:22:39 +0000231 assert( pPager->journalOpen==0 );
drhed7c8552001-04-11 14:29:21 +0000232}
233
234/*
235** When this routine is called, the pager has the journal file open and
236** a write lock on the database. This routine releases the database
237** write lock and acquires a read lock in its place. The journal file
238** is deleted and closed.
drhed7c8552001-04-11 14:29:21 +0000239*/
drhd9b02572001-04-15 00:37:09 +0000240static int pager_unwritelock(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000241 int rc;
drhd9b02572001-04-15 00:37:09 +0000242 PgHdr *pPg;
drhfa86c412002-02-02 15:01:15 +0000243 if( pPager->state<SQLITE_WRITELOCK ) return SQLITE_OK;
drh663fc632002-02-02 18:49:19 +0000244 sqlitepager_ckpt_commit(pPager);
drha7fcb052001-12-14 15:09:55 +0000245 sqliteOsClose(&pPager->jfd);
drh8cfbf082001-09-19 13:22:39 +0000246 pPager->journalOpen = 0;
247 sqliteOsDelete(pPager->zJournal);
drha7fcb052001-12-14 15:09:55 +0000248 rc = sqliteOsReadLock(&pPager->fd);
249 assert( rc==SQLITE_OK );
drh6019e162001-07-02 17:51:45 +0000250 sqliteFree( pPager->aInJournal );
251 pPager->aInJournal = 0;
drhd9b02572001-04-15 00:37:09 +0000252 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
253 pPg->inJournal = 0;
254 pPg->dirty = 0;
255 }
drha7fcb052001-12-14 15:09:55 +0000256 pPager->state = SQLITE_READLOCK;
drhed7c8552001-04-11 14:29:21 +0000257 return rc;
258}
259
drhed7c8552001-04-11 14:29:21 +0000260/*
drhfa86c412002-02-02 15:01:15 +0000261** Read a single page from the journal file opened on file descriptor
262** jfd. Playback this one page.
263*/
264static int pager_playback_one_page(Pager *pPager, OsFile *jfd){
265 int rc;
266 PgHdr *pPg; /* An existing page in the cache */
267 PageRecord pgRec;
268
drh663fc632002-02-02 18:49:19 +0000269 rc = sqliteOsRead(jfd, &pgRec, sizeof(pgRec));
drhfa86c412002-02-02 15:01:15 +0000270 if( rc!=SQLITE_OK ) return rc;
271
272 /* Sanity checking on the page */
273 if( pgRec.pgno>pPager->dbSize || pgRec.pgno==0 ) return SQLITE_CORRUPT;
274
275 /* Playback the page. Update the in-memory copy of the page
276 ** at the same time, if there is one.
277 */
278 pPg = pager_lookup(pPager, pgRec.pgno);
279 if( pPg ){
280 memcpy(PGHDR_TO_DATA(pPg), pgRec.aData, SQLITE_PAGE_SIZE);
281 memset(PGHDR_TO_EXTRA(pPg), 0, pPager->nExtra);
282 }
283 rc = sqliteOsSeek(&pPager->fd, (pgRec.pgno-1)*SQLITE_PAGE_SIZE);
284 if( rc==SQLITE_OK ){
285 rc = sqliteOsWrite(&pPager->fd, pgRec.aData, SQLITE_PAGE_SIZE);
286 }
287 return rc;
288}
289
290/*
drhed7c8552001-04-11 14:29:21 +0000291** Playback the journal and thus restore the database file to
292** the state it was in before we started making changes.
293**
drhd9b02572001-04-15 00:37:09 +0000294** The journal file format is as follows: There is an initial
295** file-type string for sanity checking. Then there is a single
296** Pgno number which is the number of pages in the database before
297** changes were made. The database is truncated to this size.
drh306dc212001-05-21 13:45:10 +0000298** Next come zero or more page records where each page record
299** consists of a Pgno and SQLITE_PAGE_SIZE bytes of data. See
300** the PageRecord structure for details.
drhed7c8552001-04-11 14:29:21 +0000301**
drhd9b02572001-04-15 00:37:09 +0000302** If the file opened as the journal file is not a well-formed
303** journal file (as determined by looking at the magic number
304** at the beginning) then this routine returns SQLITE_PROTOCOL.
305** If any other errors occur during playback, the database will
306** likely be corrupted, so the PAGER_ERR_CORRUPT bit is set in
307** pPager->errMask and SQLITE_CORRUPT is returned. If it all
308** works, then this routine returns SQLITE_OK.
drhed7c8552001-04-11 14:29:21 +0000309*/
drhd9b02572001-04-15 00:37:09 +0000310static int pager_playback(Pager *pPager){
311 int nRec; /* Number of Records */
312 int i; /* Loop counter */
313 Pgno mxPg = 0; /* Size of the original file in pages */
drhd9b02572001-04-15 00:37:09 +0000314 unsigned char aMagic[sizeof(aJournalMagic)];
drhed7c8552001-04-11 14:29:21 +0000315 int rc;
316
drhc3a64ba2001-11-22 00:01:27 +0000317 /* Figure out how many records are in the journal. Abort early if
318 ** the journal is empty.
drhed7c8552001-04-11 14:29:21 +0000319 */
drh8cfbf082001-09-19 13:22:39 +0000320 assert( pPager->journalOpen );
drha7fcb052001-12-14 15:09:55 +0000321 sqliteOsSeek(&pPager->jfd, 0);
322 rc = sqliteOsFileSize(&pPager->jfd, &nRec);
drhc3a64ba2001-11-22 00:01:27 +0000323 if( rc!=SQLITE_OK ){
324 goto end_playback;
325 }
326 nRec = (nRec - (sizeof(aMagic)+sizeof(Pgno))) / sizeof(PageRecord);
327 if( nRec<=0 ){
328 goto end_playback;
329 }
330
331 /* Read the beginning of the journal and truncate the
332 ** database file back to its original size.
333 */
drha7fcb052001-12-14 15:09:55 +0000334 rc = sqliteOsRead(&pPager->jfd, aMagic, sizeof(aMagic));
drhd9b02572001-04-15 00:37:09 +0000335 if( rc!=SQLITE_OK || memcmp(aMagic,aJournalMagic,sizeof(aMagic))!=0 ){
drh81a20f22001-10-12 17:30:04 +0000336 rc = SQLITE_PROTOCOL;
337 goto end_playback;
drhd9b02572001-04-15 00:37:09 +0000338 }
drha7fcb052001-12-14 15:09:55 +0000339 rc = sqliteOsRead(&pPager->jfd, &mxPg, sizeof(mxPg));
drhd9b02572001-04-15 00:37:09 +0000340 if( rc!=SQLITE_OK ){
drh81a20f22001-10-12 17:30:04 +0000341 goto end_playback;
drhd9b02572001-04-15 00:37:09 +0000342 }
drha7fcb052001-12-14 15:09:55 +0000343 rc = sqliteOsTruncate(&pPager->fd, mxPg*SQLITE_PAGE_SIZE);
drh81a20f22001-10-12 17:30:04 +0000344 if( rc!=SQLITE_OK ){
345 goto end_playback;
346 }
drhd9b02572001-04-15 00:37:09 +0000347 pPager->dbSize = mxPg;
348
drhfa86c412002-02-02 15:01:15 +0000349 /* Copy original pages out of the journal and back into the database file.
drhed7c8552001-04-11 14:29:21 +0000350 */
drhd9b02572001-04-15 00:37:09 +0000351 for(i=nRec-1; i>=0; i--){
drhfa86c412002-02-02 15:01:15 +0000352 rc = pager_playback_one_page(pPager, &pPager->jfd);
drhd9b02572001-04-15 00:37:09 +0000353 if( rc!=SQLITE_OK ) break;
drhed7c8552001-04-11 14:29:21 +0000354 }
drh81a20f22001-10-12 17:30:04 +0000355
356end_playback:
drhd9b02572001-04-15 00:37:09 +0000357 if( rc!=SQLITE_OK ){
358 pager_unwritelock(pPager);
359 pPager->errMask |= PAGER_ERR_CORRUPT;
360 rc = SQLITE_CORRUPT;
361 }else{
362 rc = pager_unwritelock(pPager);
drhed7c8552001-04-11 14:29:21 +0000363 }
drhd9b02572001-04-15 00:37:09 +0000364 return rc;
drhed7c8552001-04-11 14:29:21 +0000365}
366
367/*
drhfa86c412002-02-02 15:01:15 +0000368** Playback the checkpoint journal.
369**
370** This is similar to playing back the transaction journal but with
371** a few extra twists.
372**
drh663fc632002-02-02 18:49:19 +0000373** (1) The number of pages in the database file at the start of
374** the checkpoint is stored in pPager->ckptSize, not in the
375** journal file itself.
drhfa86c412002-02-02 15:01:15 +0000376**
377** (2) In addition to playing back the checkpoint journal, also
378** playback all pages of the transaction journal beginning
379** at offset pPager->ckptJSize.
380*/
381static int pager_ckpt_playback(Pager *pPager){
382 int nRec; /* Number of Records */
383 int i; /* Loop counter */
384 int rc;
385
386 /* Truncate the database back to its original size.
387 */
drh663fc632002-02-02 18:49:19 +0000388 rc = sqliteOsTruncate(&pPager->fd, pPager->ckptSize*SQLITE_PAGE_SIZE);
drhfa86c412002-02-02 15:01:15 +0000389 pPager->dbSize = pPager->ckptSize;
390
391 /* Figure out how many records are in the checkpoint journal.
392 */
393 assert( pPager->ckptOpen && pPager->journalOpen );
394 sqliteOsSeek(&pPager->cpfd, 0);
395 rc = sqliteOsFileSize(&pPager->cpfd, &nRec);
396 if( rc!=SQLITE_OK ){
397 goto end_ckpt_playback;
398 }
399 nRec /= sizeof(PageRecord);
400
401 /* Copy original pages out of the checkpoint journal and back into the
402 ** database file.
403 */
404 for(i=nRec-1; i>=0; i--){
405 rc = pager_playback_one_page(pPager, &pPager->cpfd);
406 if( rc!=SQLITE_OK ) goto end_ckpt_playback;
407 }
408
409 /* Figure out how many pages need to be copied out of the transaction
410 ** journal.
411 */
412 rc = sqliteOsSeek(&pPager->jfd, pPager->ckptJSize);
413 if( rc!=SQLITE_OK ){
414 goto end_ckpt_playback;
415 }
416 rc = sqliteOsFileSize(&pPager->jfd, &nRec);
417 if( rc!=SQLITE_OK ){
418 goto end_ckpt_playback;
419 }
420 nRec = (nRec - pPager->ckptJSize)/sizeof(PageRecord);
421 for(i=nRec-1; i>=0; i--){
422 rc = pager_playback_one_page(pPager, &pPager->jfd);
423 if( rc!=SQLITE_OK ) goto end_ckpt_playback;
424 }
425
426
427end_ckpt_playback:
drhfa86c412002-02-02 15:01:15 +0000428 if( rc!=SQLITE_OK ){
drhfa86c412002-02-02 15:01:15 +0000429 pPager->errMask |= PAGER_ERR_CORRUPT;
430 rc = SQLITE_CORRUPT;
drhfa86c412002-02-02 15:01:15 +0000431 }
432 return rc;
433}
434
435/*
drhf57b14a2001-09-14 18:54:08 +0000436** Change the maximum number of in-memory pages that are allowed.
437*/
438void sqlitepager_set_cachesize(Pager *pPager, int mxPage){
drh603240c2002-03-05 01:11:12 +0000439 if( mxPage>=0 ){
440 pPager->noSync = 0;
441 }else{
442 pPager->noSync = 1;
443 mxPage = -mxPage;
444 }
drhf57b14a2001-09-14 18:54:08 +0000445 if( mxPage>10 ){
446 pPager->mxPage = mxPage;
447 }
448}
449
450/*
drhfa86c412002-02-02 15:01:15 +0000451** Open a temporary file. Write the name of the file into zName
452** (zName must be at least SQLITE_TEMPNAME_SIZE bytes long.) Write
453** the file descriptor into *fd. Return SQLITE_OK on success or some
454** other error code if we fail.
455**
456** The OS will automatically delete the temporary file when it is
457** closed.
458*/
459static int sqlitepager_opentemp(char *zFile, OsFile *fd){
460 int cnt = 8;
461 int rc;
462 do{
463 cnt--;
464 sqliteOsTempFileName(zFile);
465 rc = sqliteOsOpenExclusive(zFile, fd, 1);
466 }while( cnt>0 && rc!=SQLITE_OK );
467 return rc;
468}
469
470/*
drhed7c8552001-04-11 14:29:21 +0000471** Create a new page cache and put a pointer to the page cache in *ppPager.
drh5e00f6c2001-09-13 13:46:56 +0000472** The file to be cached need not exist. The file is not locked until
drhd9b02572001-04-15 00:37:09 +0000473** the first call to sqlitepager_get() and is only held open until the
474** last page is released using sqlitepager_unref().
drh382c0242001-10-06 16:33:02 +0000475**
drh6446c4d2001-12-15 14:22:18 +0000476** If zFilename is NULL then a randomly-named temporary file is created
477** and used as the file to be cached. The file will be deleted
478** automatically when it is closed.
drhed7c8552001-04-11 14:29:21 +0000479*/
drh7e3b0a02001-04-28 16:52:40 +0000480int sqlitepager_open(
481 Pager **ppPager, /* Return the Pager structure here */
482 const char *zFilename, /* Name of the database file to open */
483 int mxPage, /* Max number of in-memory cache pages */
484 int nExtra /* Extra bytes append to each in-memory page */
485){
drhed7c8552001-04-11 14:29:21 +0000486 Pager *pPager;
487 int nameLen;
drh8cfbf082001-09-19 13:22:39 +0000488 OsFile fd;
489 int rc;
drh5e00f6c2001-09-13 13:46:56 +0000490 int tempFile;
491 int readOnly = 0;
drh8cfbf082001-09-19 13:22:39 +0000492 char zTemp[SQLITE_TEMPNAME_SIZE];
drhed7c8552001-04-11 14:29:21 +0000493
drhd9b02572001-04-15 00:37:09 +0000494 *ppPager = 0;
495 if( sqlite_malloc_failed ){
496 return SQLITE_NOMEM;
497 }
drh5e00f6c2001-09-13 13:46:56 +0000498 if( zFilename ){
drh8cfbf082001-09-19 13:22:39 +0000499 rc = sqliteOsOpenReadWrite(zFilename, &fd, &readOnly);
drh5e00f6c2001-09-13 13:46:56 +0000500 tempFile = 0;
501 }else{
drhfa86c412002-02-02 15:01:15 +0000502 rc = sqlitepager_opentemp(zTemp, &fd);
drh5e00f6c2001-09-13 13:46:56 +0000503 zFilename = zTemp;
504 tempFile = 1;
505 }
drh8cfbf082001-09-19 13:22:39 +0000506 if( rc!=SQLITE_OK ){
drhed7c8552001-04-11 14:29:21 +0000507 return SQLITE_CANTOPEN;
508 }
509 nameLen = strlen(zFilename);
510 pPager = sqliteMalloc( sizeof(*pPager) + nameLen*2 + 30 );
drhd9b02572001-04-15 00:37:09 +0000511 if( pPager==0 ){
drha7fcb052001-12-14 15:09:55 +0000512 sqliteOsClose(&fd);
drhd9b02572001-04-15 00:37:09 +0000513 return SQLITE_NOMEM;
514 }
drhed7c8552001-04-11 14:29:21 +0000515 pPager->zFilename = (char*)&pPager[1];
516 pPager->zJournal = &pPager->zFilename[nameLen+1];
517 strcpy(pPager->zFilename, zFilename);
518 strcpy(pPager->zJournal, zFilename);
519 strcpy(&pPager->zJournal[nameLen], "-journal");
520 pPager->fd = fd;
drh8cfbf082001-09-19 13:22:39 +0000521 pPager->journalOpen = 0;
drhfa86c412002-02-02 15:01:15 +0000522 pPager->ckptOpen = 0;
drhed7c8552001-04-11 14:29:21 +0000523 pPager->nRef = 0;
524 pPager->dbSize = -1;
drhfa86c412002-02-02 15:01:15 +0000525 pPager->ckptSize = 0;
526 pPager->ckptJSize = 0;
drhed7c8552001-04-11 14:29:21 +0000527 pPager->nPage = 0;
drhd79caeb2001-04-15 02:27:24 +0000528 pPager->mxPage = mxPage>5 ? mxPage : 10;
drhed7c8552001-04-11 14:29:21 +0000529 pPager->state = SQLITE_UNLOCK;
drhd9b02572001-04-15 00:37:09 +0000530 pPager->errMask = 0;
drh5e00f6c2001-09-13 13:46:56 +0000531 pPager->tempFile = tempFile;
532 pPager->readOnly = readOnly;
drhf57b14a2001-09-14 18:54:08 +0000533 pPager->needSync = 0;
drhed7c8552001-04-11 14:29:21 +0000534 pPager->pFirst = 0;
535 pPager->pLast = 0;
drh7c717f72001-06-24 20:39:41 +0000536 pPager->nExtra = nExtra;
drhed7c8552001-04-11 14:29:21 +0000537 memset(pPager->aHash, 0, sizeof(pPager->aHash));
538 *ppPager = pPager;
539 return SQLITE_OK;
540}
541
542/*
drh72f82862001-05-24 21:06:34 +0000543** Set the destructor for this pager. If not NULL, the destructor is called
drh5e00f6c2001-09-13 13:46:56 +0000544** when the reference count on each page reaches zero. The destructor can
545** be used to clean up information in the extra segment appended to each page.
drh72f82862001-05-24 21:06:34 +0000546**
547** The destructor is not called as a result sqlitepager_close().
548** Destructors are only called by sqlitepager_unref().
549*/
550void sqlitepager_set_destructor(Pager *pPager, void (*xDesc)(void*)){
551 pPager->xDestructor = xDesc;
552}
553
554/*
drh5e00f6c2001-09-13 13:46:56 +0000555** Return the total number of pages in the disk file associated with
556** pPager.
drhed7c8552001-04-11 14:29:21 +0000557*/
drhd9b02572001-04-15 00:37:09 +0000558int sqlitepager_pagecount(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +0000559 int n;
drhd9b02572001-04-15 00:37:09 +0000560 assert( pPager!=0 );
drhed7c8552001-04-11 14:29:21 +0000561 if( pPager->dbSize>=0 ){
562 return pPager->dbSize;
563 }
drha7fcb052001-12-14 15:09:55 +0000564 if( sqliteOsFileSize(&pPager->fd, &n)!=SQLITE_OK ){
drh81a20f22001-10-12 17:30:04 +0000565 pPager->errMask |= PAGER_ERR_DISK;
drh8cfbf082001-09-19 13:22:39 +0000566 return 0;
drhed7c8552001-04-11 14:29:21 +0000567 }
drh8cfbf082001-09-19 13:22:39 +0000568 n /= SQLITE_PAGE_SIZE;
drhd9b02572001-04-15 00:37:09 +0000569 if( pPager->state!=SQLITE_UNLOCK ){
drhed7c8552001-04-11 14:29:21 +0000570 pPager->dbSize = n;
571 }
572 return n;
573}
574
575/*
576** Shutdown the page cache. Free all memory and close all files.
577**
578** If a transaction was in progress when this routine is called, that
579** transaction is rolled back. All outstanding pages are invalidated
580** and their memory is freed. Any attempt to use a page associated
581** with this page cache after this function returns will likely
582** result in a coredump.
583*/
drhd9b02572001-04-15 00:37:09 +0000584int sqlitepager_close(Pager *pPager){
585 PgHdr *pPg, *pNext;
drhed7c8552001-04-11 14:29:21 +0000586 switch( pPager->state ){
587 case SQLITE_WRITELOCK: {
drhd9b02572001-04-15 00:37:09 +0000588 sqlitepager_rollback(pPager);
drha7fcb052001-12-14 15:09:55 +0000589 sqliteOsUnlock(&pPager->fd);
drh8cfbf082001-09-19 13:22:39 +0000590 assert( pPager->journalOpen==0 );
drhed7c8552001-04-11 14:29:21 +0000591 break;
592 }
593 case SQLITE_READLOCK: {
drha7fcb052001-12-14 15:09:55 +0000594 sqliteOsUnlock(&pPager->fd);
drhed7c8552001-04-11 14:29:21 +0000595 break;
596 }
597 default: {
598 /* Do nothing */
599 break;
600 }
601 }
drhd9b02572001-04-15 00:37:09 +0000602 for(pPg=pPager->pAll; pPg; pPg=pNext){
603 pNext = pPg->pNextAll;
604 sqliteFree(pPg);
drhed7c8552001-04-11 14:29:21 +0000605 }
drha7fcb052001-12-14 15:09:55 +0000606 sqliteOsClose(&pPager->fd);
drh8cfbf082001-09-19 13:22:39 +0000607 assert( pPager->journalOpen==0 );
drh5e00f6c2001-09-13 13:46:56 +0000608 if( pPager->tempFile ){
drhfa86c412002-02-02 15:01:15 +0000609 /* sqliteOsDelete(pPager->zFilename); */
drh5e00f6c2001-09-13 13:46:56 +0000610 }
drhed7c8552001-04-11 14:29:21 +0000611 sqliteFree(pPager);
612 return SQLITE_OK;
613}
614
615/*
drh5e00f6c2001-09-13 13:46:56 +0000616** Return the page number for the given page data.
drhed7c8552001-04-11 14:29:21 +0000617*/
drhd9b02572001-04-15 00:37:09 +0000618Pgno sqlitepager_pagenumber(void *pData){
drhed7c8552001-04-11 14:29:21 +0000619 PgHdr *p = DATA_TO_PGHDR(pData);
620 return p->pgno;
621}
622
623/*
drh7e3b0a02001-04-28 16:52:40 +0000624** Increment the reference count for a page. If the page is
625** currently on the freelist (the reference count is zero) then
626** remove it from the freelist.
627*/
drhdf0b3b02001-06-23 11:36:20 +0000628static void page_ref(PgHdr *pPg){
drh7e3b0a02001-04-28 16:52:40 +0000629 if( pPg->nRef==0 ){
630 /* The page is currently on the freelist. Remove it. */
631 if( pPg->pPrevFree ){
632 pPg->pPrevFree->pNextFree = pPg->pNextFree;
633 }else{
634 pPg->pPager->pFirst = pPg->pNextFree;
635 }
636 if( pPg->pNextFree ){
637 pPg->pNextFree->pPrevFree = pPg->pPrevFree;
638 }else{
639 pPg->pPager->pLast = pPg->pPrevFree;
640 }
641 pPg->pPager->nRef++;
642 }
643 pPg->nRef++;
drhdd793422001-06-28 01:54:48 +0000644 REFINFO(pPg);
drhdf0b3b02001-06-23 11:36:20 +0000645}
646
647/*
648** Increment the reference count for a page. The input pointer is
649** a reference to the page data.
650*/
651int sqlitepager_ref(void *pData){
652 PgHdr *pPg = DATA_TO_PGHDR(pData);
653 page_ref(pPg);
drh8c42ca92001-06-22 19:15:00 +0000654 return SQLITE_OK;
drh7e3b0a02001-04-28 16:52:40 +0000655}
656
657/*
drhb19a2bc2001-09-16 00:13:26 +0000658** Sync the journal and then write all free dirty pages to the database
659** file.
660**
661** Writing all free dirty pages to the database after the sync is a
662** non-obvious optimization. fsync() is an expensive operation so we
drhaaab5722002-02-19 13:39:21 +0000663** want to minimize the number ot times it is called. After an fsync() call,
drh6446c4d2001-12-15 14:22:18 +0000664** we are free to write dirty pages back to the database. It is best
665** to go ahead and write as many dirty pages as possible to minimize
666** the risk of having to do another fsync() later on. Writing dirty
667** free pages in this way was observed to make database operations go
668** up to 10 times faster.
drhfa86c412002-02-02 15:01:15 +0000669**
670** If we are writing to temporary database, there is no need to preserve
671** the integrity of the journal file, so we can save time and skip the
672** fsync().
drh50e5dad2001-09-15 00:57:28 +0000673*/
674static int syncAllPages(Pager *pPager){
675 PgHdr *pPg;
676 int rc = SQLITE_OK;
677 if( pPager->needSync ){
drhfa86c412002-02-02 15:01:15 +0000678 if( !pPager->tempFile ){
679 rc = sqliteOsSync(&pPager->jfd);
680 if( rc!=0 ) return rc;
681 }
drh50e5dad2001-09-15 00:57:28 +0000682 pPager->needSync = 0;
683 }
684 for(pPg=pPager->pFirst; pPg; pPg=pPg->pNextFree){
685 if( pPg->dirty ){
drha7fcb052001-12-14 15:09:55 +0000686 sqliteOsSeek(&pPager->fd, (pPg->pgno-1)*SQLITE_PAGE_SIZE);
687 rc = sqliteOsWrite(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drh50e5dad2001-09-15 00:57:28 +0000688 if( rc!=SQLITE_OK ) break;
689 pPg->dirty = 0;
690 }
691 }
drh81a20f22001-10-12 17:30:04 +0000692 return rc;
drh50e5dad2001-09-15 00:57:28 +0000693}
694
695/*
drhd9b02572001-04-15 00:37:09 +0000696** Acquire a page.
697**
drh58a11682001-11-10 13:51:08 +0000698** A read lock on the disk file is obtained when the first page is acquired.
drh5e00f6c2001-09-13 13:46:56 +0000699** This read lock is dropped when the last page is released.
drhd9b02572001-04-15 00:37:09 +0000700**
drh306dc212001-05-21 13:45:10 +0000701** A _get works for any page number greater than 0. If the database
702** file is smaller than the requested page, then no actual disk
703** read occurs and the memory image of the page is initialized to
704** all zeros. The extra data appended to a page is always initialized
705** to zeros the first time a page is loaded into memory.
706**
drhd9b02572001-04-15 00:37:09 +0000707** The acquisition might fail for several reasons. In all cases,
708** an appropriate error code is returned and *ppPage is set to NULL.
drh7e3b0a02001-04-28 16:52:40 +0000709**
710** See also sqlitepager_lookup(). Both this routine and _lookup() attempt
711** to find a page in the in-memory cache first. If the page is not already
drh5e00f6c2001-09-13 13:46:56 +0000712** in memory, this routine goes to disk to read it in whereas _lookup()
drh7e3b0a02001-04-28 16:52:40 +0000713** just returns 0. This routine acquires a read-lock the first time it
714** has to go to disk, and could also playback an old journal if necessary.
715** Since _lookup() never goes to disk, it never has to deal with locks
716** or journal files.
drhed7c8552001-04-11 14:29:21 +0000717*/
drhd9b02572001-04-15 00:37:09 +0000718int sqlitepager_get(Pager *pPager, Pgno pgno, void **ppPage){
drhed7c8552001-04-11 14:29:21 +0000719 PgHdr *pPg;
720
drhd9b02572001-04-15 00:37:09 +0000721 /* Make sure we have not hit any critical errors.
722 */
723 if( pPager==0 || pgno==0 ){
724 return SQLITE_ERROR;
725 }
726 if( pPager->errMask & ~(PAGER_ERR_FULL) ){
727 return pager_errcode(pPager);
728 }
729
drhed7c8552001-04-11 14:29:21 +0000730 /* If this is the first page accessed, then get a read lock
731 ** on the database file.
732 */
733 if( pPager->nRef==0 ){
drha7fcb052001-12-14 15:09:55 +0000734 if( sqliteOsReadLock(&pPager->fd)!=SQLITE_OK ){
drhed7c8552001-04-11 14:29:21 +0000735 *ppPage = 0;
736 return SQLITE_BUSY;
737 }
drhd9b02572001-04-15 00:37:09 +0000738 pPager->state = SQLITE_READLOCK;
drhed7c8552001-04-11 14:29:21 +0000739
740 /* If a journal file exists, try to play it back.
741 */
drh8cfbf082001-09-19 13:22:39 +0000742 if( sqliteOsFileExists(pPager->zJournal) ){
drhf57b3392001-10-08 13:22:32 +0000743 int rc, dummy;
drhed7c8552001-04-11 14:29:21 +0000744
drha7fcb052001-12-14 15:09:55 +0000745 /* Get a write lock on the database
746 */
747 rc = sqliteOsWriteLock(&pPager->fd);
748 if( rc!=SQLITE_OK ){
drh6446c4d2001-12-15 14:22:18 +0000749 rc = sqliteOsUnlock(&pPager->fd);
drha7fcb052001-12-14 15:09:55 +0000750 assert( rc==SQLITE_OK );
751 *ppPage = 0;
752 return SQLITE_BUSY;
753 }
754 pPager->state = SQLITE_WRITELOCK;
755
drhed7c8552001-04-11 14:29:21 +0000756 /* Open the journal for exclusive access. Return SQLITE_BUSY if
drhf57b3392001-10-08 13:22:32 +0000757 ** we cannot get exclusive access to the journal file.
758 **
759 ** Even though we will only be reading from the journal, not writing,
760 ** we have to open the journal for writing in order to obtain an
761 ** exclusive access lock.
drhed7c8552001-04-11 14:29:21 +0000762 */
drhf57b3392001-10-08 13:22:32 +0000763 rc = sqliteOsOpenReadWrite(pPager->zJournal, &pPager->jfd, &dummy);
drha7fcb052001-12-14 15:09:55 +0000764 if( rc!=SQLITE_OK ){
765 rc = sqliteOsUnlock(&pPager->fd);
766 assert( rc==SQLITE_OK );
drhed7c8552001-04-11 14:29:21 +0000767 *ppPage = 0;
768 return SQLITE_BUSY;
769 }
drha7fcb052001-12-14 15:09:55 +0000770 pPager->journalOpen = 1;
drhed7c8552001-04-11 14:29:21 +0000771
772 /* Playback and delete the journal. Drop the database write
773 ** lock and reacquire the read lock.
774 */
drhd9b02572001-04-15 00:37:09 +0000775 rc = pager_playback(pPager);
776 if( rc!=SQLITE_OK ){
777 return rc;
778 }
drhed7c8552001-04-11 14:29:21 +0000779 }
780 pPg = 0;
781 }else{
782 /* Search for page in cache */
drhd9b02572001-04-15 00:37:09 +0000783 pPg = pager_lookup(pPager, pgno);
drhed7c8552001-04-11 14:29:21 +0000784 }
785 if( pPg==0 ){
drhd9b02572001-04-15 00:37:09 +0000786 /* The requested page is not in the page cache. */
drhed7c8552001-04-11 14:29:21 +0000787 int h;
drh7e3b0a02001-04-28 16:52:40 +0000788 pPager->nMiss++;
drhed7c8552001-04-11 14:29:21 +0000789 if( pPager->nPage<pPager->mxPage || pPager->pFirst==0 ){
790 /* Create a new page */
drh7e3b0a02001-04-28 16:52:40 +0000791 pPg = sqliteMalloc( sizeof(*pPg) + SQLITE_PAGE_SIZE + pPager->nExtra );
drhd9b02572001-04-15 00:37:09 +0000792 if( pPg==0 ){
793 *ppPage = 0;
794 pager_unwritelock(pPager);
795 pPager->errMask |= PAGER_ERR_MEM;
796 return SQLITE_NOMEM;
797 }
drhed7c8552001-04-11 14:29:21 +0000798 pPg->pPager = pPager;
drhd9b02572001-04-15 00:37:09 +0000799 pPg->pNextAll = pPager->pAll;
800 if( pPager->pAll ){
801 pPager->pAll->pPrevAll = pPg;
802 }
803 pPg->pPrevAll = 0;
drhd79caeb2001-04-15 02:27:24 +0000804 pPager->pAll = pPg;
drhd9b02572001-04-15 00:37:09 +0000805 pPager->nPage++;
drhed7c8552001-04-11 14:29:21 +0000806 }else{
drhd9b02572001-04-15 00:37:09 +0000807 /* Recycle an older page. First locate the page to be recycled.
808 ** Try to find one that is not dirty and is near the head of
809 ** of the free list */
drhed7c8552001-04-11 14:29:21 +0000810 pPg = pPager->pFirst;
drh603240c2002-03-05 01:11:12 +0000811 while( pPg && pPg->dirty ){
drhd9b02572001-04-15 00:37:09 +0000812 pPg = pPg->pNextFree;
813 }
drhb19a2bc2001-09-16 00:13:26 +0000814
815 /* If we could not find a page that has not been used recently
816 ** and which is not dirty, then sync the journal and write all
817 ** dirty free pages into the database file, thus making them
818 ** clean pages and available for recycling.
819 **
820 ** We have to sync the journal before writing a page to the main
821 ** database. But syncing is a very slow operation. So after a
822 ** sync, it is best to write everything we can back to the main
823 ** database to minimize the risk of having to sync again in the
824 ** near future. That is way we write all dirty pages after a
825 ** sync.
826 */
drh603240c2002-03-05 01:11:12 +0000827 if( pPg==0 ){
drh50e5dad2001-09-15 00:57:28 +0000828 int rc = syncAllPages(pPager);
829 if( rc!=0 ){
830 sqlitepager_rollback(pPager);
831 *ppPage = 0;
832 return SQLITE_IOERR;
833 }
834 pPg = pPager->pFirst;
835 }
drhd9b02572001-04-15 00:37:09 +0000836 assert( pPg->nRef==0 );
drh50e5dad2001-09-15 00:57:28 +0000837 assert( pPg->dirty==0 );
drhd9b02572001-04-15 00:37:09 +0000838
839 /* Unlink the old page from the free list and the hash table
840 */
drh6019e162001-07-02 17:51:45 +0000841 if( pPg->pPrevFree ){
842 pPg->pPrevFree->pNextFree = pPg->pNextFree;
drhed7c8552001-04-11 14:29:21 +0000843 }else{
drh6019e162001-07-02 17:51:45 +0000844 assert( pPager->pFirst==pPg );
845 pPager->pFirst = pPg->pNextFree;
drhed7c8552001-04-11 14:29:21 +0000846 }
drh6019e162001-07-02 17:51:45 +0000847 if( pPg->pNextFree ){
848 pPg->pNextFree->pPrevFree = pPg->pPrevFree;
849 }else{
850 assert( pPager->pLast==pPg );
851 pPager->pLast = pPg->pPrevFree;
852 }
853 pPg->pNextFree = pPg->pPrevFree = 0;
drhed7c8552001-04-11 14:29:21 +0000854 if( pPg->pNextHash ){
855 pPg->pNextHash->pPrevHash = pPg->pPrevHash;
856 }
857 if( pPg->pPrevHash ){
858 pPg->pPrevHash->pNextHash = pPg->pNextHash;
859 }else{
drhd9b02572001-04-15 00:37:09 +0000860 h = pager_hash(pPg->pgno);
drhed7c8552001-04-11 14:29:21 +0000861 assert( pPager->aHash[h]==pPg );
862 pPager->aHash[h] = pPg->pNextHash;
863 }
drh6019e162001-07-02 17:51:45 +0000864 pPg->pNextHash = pPg->pPrevHash = 0;
drhd9b02572001-04-15 00:37:09 +0000865 pPager->nOvfl++;
drhed7c8552001-04-11 14:29:21 +0000866 }
867 pPg->pgno = pgno;
drh1ab43002002-01-14 09:28:19 +0000868 if( pPager->aInJournal && (int)pgno<=pPager->origDbSize ){
drh6019e162001-07-02 17:51:45 +0000869 pPg->inJournal = (pPager->aInJournal[pgno/8] & (1<<(pgno&7)))!=0;
870 }else{
871 pPg->inJournal = 0;
872 }
drh663fc632002-02-02 18:49:19 +0000873 if( pPager->aInCkpt && (int)pgno<=pPager->ckptSize ){
drhfa86c412002-02-02 15:01:15 +0000874 pPg->inCkpt = (pPager->aInCkpt[pgno/8] & (1<<(pgno&7)))!=0;
875 }else{
876 pPg->inCkpt = 0;
877 }
drhed7c8552001-04-11 14:29:21 +0000878 pPg->dirty = 0;
879 pPg->nRef = 1;
drhdd793422001-06-28 01:54:48 +0000880 REFINFO(pPg);
drhd9b02572001-04-15 00:37:09 +0000881 pPager->nRef++;
882 h = pager_hash(pgno);
drhed7c8552001-04-11 14:29:21 +0000883 pPg->pNextHash = pPager->aHash[h];
884 pPager->aHash[h] = pPg;
885 if( pPg->pNextHash ){
886 assert( pPg->pNextHash->pPrevHash==0 );
887 pPg->pNextHash->pPrevHash = pPg;
888 }
drh306dc212001-05-21 13:45:10 +0000889 if( pPager->dbSize<0 ) sqlitepager_pagecount(pPager);
drh1ab43002002-01-14 09:28:19 +0000890 if( pPager->dbSize<(int)pgno ){
drh306dc212001-05-21 13:45:10 +0000891 memset(PGHDR_TO_DATA(pPg), 0, SQLITE_PAGE_SIZE);
892 }else{
drh81a20f22001-10-12 17:30:04 +0000893 int rc;
drha7fcb052001-12-14 15:09:55 +0000894 sqliteOsSeek(&pPager->fd, (pgno-1)*SQLITE_PAGE_SIZE);
895 rc = sqliteOsRead(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drh81a20f22001-10-12 17:30:04 +0000896 if( rc!=SQLITE_OK ){
897 return rc;
898 }
drh306dc212001-05-21 13:45:10 +0000899 }
drh7e3b0a02001-04-28 16:52:40 +0000900 if( pPager->nExtra>0 ){
901 memset(PGHDR_TO_EXTRA(pPg), 0, pPager->nExtra);
902 }
drhed7c8552001-04-11 14:29:21 +0000903 }else{
drhd9b02572001-04-15 00:37:09 +0000904 /* The requested page is in the page cache. */
drh7e3b0a02001-04-28 16:52:40 +0000905 pPager->nHit++;
drhdf0b3b02001-06-23 11:36:20 +0000906 page_ref(pPg);
drhed7c8552001-04-11 14:29:21 +0000907 }
908 *ppPage = PGHDR_TO_DATA(pPg);
909 return SQLITE_OK;
910}
911
912/*
drh7e3b0a02001-04-28 16:52:40 +0000913** Acquire a page if it is already in the in-memory cache. Do
914** not read the page from disk. Return a pointer to the page,
915** or 0 if the page is not in cache.
916**
917** See also sqlitepager_get(). The difference between this routine
918** and sqlitepager_get() is that _get() will go to the disk and read
919** in the page if the page is not already in cache. This routine
drh5e00f6c2001-09-13 13:46:56 +0000920** returns NULL if the page is not in cache or if a disk I/O error
921** has ever happened.
drh7e3b0a02001-04-28 16:52:40 +0000922*/
923void *sqlitepager_lookup(Pager *pPager, Pgno pgno){
924 PgHdr *pPg;
925
926 /* Make sure we have not hit any critical errors.
927 */
928 if( pPager==0 || pgno==0 ){
929 return 0;
930 }
931 if( pPager->errMask & ~(PAGER_ERR_FULL) ){
932 return 0;
933 }
934 if( pPager->nRef==0 ){
935 return 0;
936 }
937 pPg = pager_lookup(pPager, pgno);
938 if( pPg==0 ) return 0;
drhdf0b3b02001-06-23 11:36:20 +0000939 page_ref(pPg);
drh7e3b0a02001-04-28 16:52:40 +0000940 return PGHDR_TO_DATA(pPg);
941}
942
943/*
drhed7c8552001-04-11 14:29:21 +0000944** Release a page.
945**
946** If the number of references to the page drop to zero, then the
947** page is added to the LRU list. When all references to all pages
drhd9b02572001-04-15 00:37:09 +0000948** are released, a rollback occurs and the lock on the database is
drhed7c8552001-04-11 14:29:21 +0000949** removed.
950*/
drhd9b02572001-04-15 00:37:09 +0000951int sqlitepager_unref(void *pData){
drhed7c8552001-04-11 14:29:21 +0000952 PgHdr *pPg;
drhd9b02572001-04-15 00:37:09 +0000953
954 /* Decrement the reference count for this page
955 */
drhed7c8552001-04-11 14:29:21 +0000956 pPg = DATA_TO_PGHDR(pData);
957 assert( pPg->nRef>0 );
drhed7c8552001-04-11 14:29:21 +0000958 pPg->nRef--;
drhdd793422001-06-28 01:54:48 +0000959 REFINFO(pPg);
drhd9b02572001-04-15 00:37:09 +0000960
drh72f82862001-05-24 21:06:34 +0000961 /* When the number of references to a page reach 0, call the
962 ** destructor and add the page to the freelist.
drhd9b02572001-04-15 00:37:09 +0000963 */
drhed7c8552001-04-11 14:29:21 +0000964 if( pPg->nRef==0 ){
drh1eaa2692001-09-18 02:02:23 +0000965 Pager *pPager;
966 pPager = pPg->pPager;
drhd9b02572001-04-15 00:37:09 +0000967 pPg->pNextFree = 0;
968 pPg->pPrevFree = pPager->pLast;
drhed7c8552001-04-11 14:29:21 +0000969 pPager->pLast = pPg;
drhd9b02572001-04-15 00:37:09 +0000970 if( pPg->pPrevFree ){
971 pPg->pPrevFree->pNextFree = pPg;
drhed7c8552001-04-11 14:29:21 +0000972 }else{
973 pPager->pFirst = pPg;
974 }
drh72f82862001-05-24 21:06:34 +0000975 if( pPager->xDestructor ){
976 pPager->xDestructor(pData);
977 }
drhd9b02572001-04-15 00:37:09 +0000978
979 /* When all pages reach the freelist, drop the read lock from
980 ** the database file.
981 */
982 pPager->nRef--;
983 assert( pPager->nRef>=0 );
984 if( pPager->nRef==0 ){
985 pager_reset(pPager);
986 }
drhed7c8552001-04-11 14:29:21 +0000987 }
drhd9b02572001-04-15 00:37:09 +0000988 return SQLITE_OK;
drhed7c8552001-04-11 14:29:21 +0000989}
990
991/*
drh4b845d72002-03-05 12:41:19 +0000992** Acquire a write-lock on the database. The lock is removed when
993** the any of the following happen:
994**
995** * sqlitepager_commit() is called.
996** * sqlitepager_rollback() is called.
997** * sqlitepager_close() is called.
998** * sqlitepager_unref() is called to on every outstanding page.
999**
1000** The parameter to this routine is a pointer to any open page of the
1001** database file. Nothing changes about the page - it is used merely
1002** to acquire a pointer to the Pager structure and as proof that there
1003** is already a read-lock on the database.
1004**
1005** If the database is already write-locked, this routine is a no-op.
1006*/
1007int sqlitepager_begin(void *pData){
1008 PgHdr *pPg = DATA_TO_PGHDR(pData);
1009 Pager *pPager = pPg->pPager;
1010 int rc = SQLITE_OK;
1011 assert( pPg->nRef>0 );
1012 assert( pPager->state!=SQLITE_UNLOCK );
1013 if( pPager->state==SQLITE_READLOCK ){
1014 assert( pPager->aInJournal==0 );
1015 rc = sqliteOsWriteLock(&pPager->fd);
1016 if( rc!=SQLITE_OK ){
1017 return rc;
1018 }
1019 pPager->aInJournal = sqliteMalloc( pPager->dbSize/8 + 1 );
1020 if( pPager->aInJournal==0 ){
1021 sqliteOsReadLock(&pPager->fd);
1022 return SQLITE_NOMEM;
1023 }
1024 rc = sqliteOsOpenExclusive(pPager->zJournal, &pPager->jfd, 0);
1025 if( rc!=SQLITE_OK ){
1026 sqliteFree(pPager->aInJournal);
1027 pPager->aInJournal = 0;
1028 sqliteOsReadLock(&pPager->fd);
1029 return SQLITE_CANTOPEN;
1030 }
1031 pPager->journalOpen = 1;
1032 pPager->needSync = !pPager->noSync;
1033 pPager->state = SQLITE_WRITELOCK;
1034 sqlitepager_pagecount(pPager);
1035 pPager->origDbSize = pPager->dbSize;
1036 rc = sqliteOsWrite(&pPager->jfd, aJournalMagic, sizeof(aJournalMagic));
1037 if( rc==SQLITE_OK ){
1038 rc = sqliteOsWrite(&pPager->jfd, &pPager->dbSize, sizeof(Pgno));
1039 }
1040 if( rc!=SQLITE_OK ){
1041 rc = pager_unwritelock(pPager);
1042 if( rc==SQLITE_OK ) rc = SQLITE_FULL;
1043 }
1044 }
1045 return rc;
1046}
1047
1048/*
drhed7c8552001-04-11 14:29:21 +00001049** Mark a data page as writeable. The page is written into the journal
1050** if it is not there already. This routine must be called before making
1051** changes to a page.
1052**
1053** The first time this routine is called, the pager creates a new
1054** journal and acquires a write lock on the database. If the write
1055** lock could not be acquired, this routine returns SQLITE_BUSY. The
drh306dc212001-05-21 13:45:10 +00001056** calling routine must check for that return value and be careful not to
drhed7c8552001-04-11 14:29:21 +00001057** change any page data until this routine returns SQLITE_OK.
drhd9b02572001-04-15 00:37:09 +00001058**
1059** If the journal file could not be written because the disk is full,
1060** then this routine returns SQLITE_FULL and does an immediate rollback.
1061** All subsequent write attempts also return SQLITE_FULL until there
1062** is a call to sqlitepager_commit() or sqlitepager_rollback() to
1063** reset.
drhed7c8552001-04-11 14:29:21 +00001064*/
drhd9b02572001-04-15 00:37:09 +00001065int sqlitepager_write(void *pData){
drh69688d52001-04-14 16:38:23 +00001066 PgHdr *pPg = DATA_TO_PGHDR(pData);
1067 Pager *pPager = pPg->pPager;
drhd79caeb2001-04-15 02:27:24 +00001068 int rc = SQLITE_OK;
drh69688d52001-04-14 16:38:23 +00001069
drh6446c4d2001-12-15 14:22:18 +00001070 /* Check for errors
1071 */
drhd9b02572001-04-15 00:37:09 +00001072 if( pPager->errMask ){
1073 return pager_errcode(pPager);
1074 }
drh5e00f6c2001-09-13 13:46:56 +00001075 if( pPager->readOnly ){
1076 return SQLITE_PERM;
1077 }
drh6446c4d2001-12-15 14:22:18 +00001078
1079 /* Mark the page as dirty. If the page has already been written
1080 ** to the journal then we can return right away.
1081 */
drhd9b02572001-04-15 00:37:09 +00001082 pPg->dirty = 1;
drhfa86c412002-02-02 15:01:15 +00001083 if( pPg->inJournal && (pPg->inCkpt || pPager->ckptOpen==0) ){
1084 return SQLITE_OK;
1085 }
drh6446c4d2001-12-15 14:22:18 +00001086
1087 /* If we get this far, it means that the page needs to be
drhfa86c412002-02-02 15:01:15 +00001088 ** written to the transaction journal or the ckeckpoint journal
1089 ** or both.
1090 **
1091 ** First check to see that the transaction journal exists and
1092 ** create it if it does not.
drh6446c4d2001-12-15 14:22:18 +00001093 */
drhd9b02572001-04-15 00:37:09 +00001094 assert( pPager->state!=SQLITE_UNLOCK );
drh4b845d72002-03-05 12:41:19 +00001095 rc = sqlitepager_begin(pData);
1096 if( rc!=SQLITE_OK ) return rc;
drhd9b02572001-04-15 00:37:09 +00001097 assert( pPager->state==SQLITE_WRITELOCK );
drh8cfbf082001-09-19 13:22:39 +00001098 assert( pPager->journalOpen );
drh6446c4d2001-12-15 14:22:18 +00001099
drhfa86c412002-02-02 15:01:15 +00001100 /* The transaction journal now exists and we have a write lock on the
1101 ** main database file. Write the current page to the transaction
1102 ** journal if it is not there already.
drh6446c4d2001-12-15 14:22:18 +00001103 */
drhfa86c412002-02-02 15:01:15 +00001104 if( !pPg->inJournal && (int)pPg->pgno <= pPager->origDbSize ){
drha7fcb052001-12-14 15:09:55 +00001105 rc = sqliteOsWrite(&pPager->jfd, &pPg->pgno, sizeof(Pgno));
drhd9b02572001-04-15 00:37:09 +00001106 if( rc==SQLITE_OK ){
drha7fcb052001-12-14 15:09:55 +00001107 rc = sqliteOsWrite(&pPager->jfd, pData, SQLITE_PAGE_SIZE);
drhd9b02572001-04-15 00:37:09 +00001108 }
1109 if( rc!=SQLITE_OK ){
1110 sqlitepager_rollback(pPager);
1111 pPager->errMask |= PAGER_ERR_FULL;
1112 return rc;
1113 }
drh6019e162001-07-02 17:51:45 +00001114 assert( pPager->aInJournal!=0 );
1115 pPager->aInJournal[pPg->pgno/8] |= 1<<(pPg->pgno&7);
drh603240c2002-03-05 01:11:12 +00001116 pPager->needSync = !pPager->noSync;
drhfa86c412002-02-02 15:01:15 +00001117 pPg->inJournal = 1;
1118 if( pPager->ckptOpen ){
1119 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1120 pPg->inCkpt = 1;
1121 }
drh69688d52001-04-14 16:38:23 +00001122 }
drh6446c4d2001-12-15 14:22:18 +00001123
drhfa86c412002-02-02 15:01:15 +00001124 /* If the checkpoint journal is open and the page is not in it,
1125 ** then write the current page to the checkpoint journal.
drh6446c4d2001-12-15 14:22:18 +00001126 */
drh663fc632002-02-02 18:49:19 +00001127 if( pPager->ckptOpen && !pPg->inCkpt && (int)pPg->pgno<=pPager->ckptSize ){
drh1e336b42002-02-14 12:50:33 +00001128 assert( pPg->inJournal || (int)pPg->pgno>pPager->origDbSize );
drhfa86c412002-02-02 15:01:15 +00001129 rc = sqliteOsWrite(&pPager->cpfd, &pPg->pgno, sizeof(Pgno));
1130 if( rc==SQLITE_OK ){
1131 rc = sqliteOsWrite(&pPager->cpfd, pData, SQLITE_PAGE_SIZE);
1132 }
1133 if( rc!=SQLITE_OK ){
1134 sqlitepager_rollback(pPager);
1135 pPager->errMask |= PAGER_ERR_FULL;
1136 return rc;
1137 }
1138 assert( pPager->aInCkpt!=0 );
1139 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1140 pPg->inCkpt = 1;
1141 }
1142
1143 /* Update the database size and return.
1144 */
drh1ab43002002-01-14 09:28:19 +00001145 if( pPager->dbSize<(int)pPg->pgno ){
drh306dc212001-05-21 13:45:10 +00001146 pPager->dbSize = pPg->pgno;
1147 }
drh69688d52001-04-14 16:38:23 +00001148 return rc;
drhed7c8552001-04-11 14:29:21 +00001149}
1150
1151/*
drhaacc5432002-01-06 17:07:40 +00001152** Return TRUE if the page given in the argument was previously passed
drh6019e162001-07-02 17:51:45 +00001153** to sqlitepager_write(). In other words, return TRUE if it is ok
1154** to change the content of the page.
1155*/
1156int sqlitepager_iswriteable(void *pData){
1157 PgHdr *pPg = DATA_TO_PGHDR(pData);
1158 return pPg->dirty;
1159}
1160
1161/*
drh30e58752002-03-02 20:41:57 +00001162** A call to this routine tells the pager that it is not necessary to
1163** write the information on page "pgno" back to the disk, even though
1164** that page might be marked as dirty.
1165**
1166** The overlying software layer calls this routine when all of the data
1167** on the given page is unused. The pager marks the page as clean so
1168** that it does not get written to disk.
1169**
1170** Tests show that this optimization, together with the
1171** sqlitepager_dont_rollback() below, more than double the speed
1172** of large INSERT operations and quadruple the speed of large DELETEs.
1173*/
1174void sqlitepager_dont_write(Pager *pPager, Pgno pgno){
1175 PgHdr *pPg;
1176 pPg = pager_lookup(pPager, pgno);
1177 if( pPg && pPg->dirty ){
1178 pPg->dirty = 0;
1179 }
1180}
1181
1182/*
1183** A call to this routine tells the pager that if a rollback occurs,
1184** it is not necessary to restore the data on the given page. This
1185** means that the pager does not have to record the given page in the
1186** rollback journal.
1187*/
1188void sqlitepager_dont_rollback(void *pData){
1189 PgHdr *pPg = DATA_TO_PGHDR(pData);
1190 Pager *pPager = pPg->pPager;
1191
1192 if( pPager->state!=SQLITE_WRITELOCK || pPager->journalOpen==0 ) return;
1193 if( !pPg->inJournal && (int)pPg->pgno <= pPager->origDbSize ){
1194 assert( pPager->aInJournal!=0 );
1195 pPager->aInJournal[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1196 pPg->inJournal = 1;
1197 if( pPager->ckptOpen ){
1198 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1199 pPg->inCkpt = 1;
1200 }
1201 }
1202 if( pPager->ckptOpen && !pPg->inCkpt && (int)pPg->pgno<=pPager->ckptSize ){
1203 assert( pPg->inJournal || (int)pPg->pgno>pPager->origDbSize );
1204 assert( pPager->aInCkpt!=0 );
1205 pPager->aInCkpt[pPg->pgno/8] |= 1<<(pPg->pgno&7);
1206 pPg->inCkpt = 1;
1207 }
1208}
1209
1210/*
drhed7c8552001-04-11 14:29:21 +00001211** Commit all changes to the database and release the write lock.
drhd9b02572001-04-15 00:37:09 +00001212**
1213** If the commit fails for any reason, a rollback attempt is made
1214** and an error code is returned. If the commit worked, SQLITE_OK
1215** is returned.
drhed7c8552001-04-11 14:29:21 +00001216*/
drhd9b02572001-04-15 00:37:09 +00001217int sqlitepager_commit(Pager *pPager){
drha1b351a2001-09-14 16:42:12 +00001218 int rc;
drhed7c8552001-04-11 14:29:21 +00001219 PgHdr *pPg;
drhd9b02572001-04-15 00:37:09 +00001220
1221 if( pPager->errMask==PAGER_ERR_FULL ){
1222 rc = sqlitepager_rollback(pPager);
1223 if( rc==SQLITE_OK ) rc = SQLITE_FULL;
1224 return rc;
1225 }
1226 if( pPager->errMask!=0 ){
1227 rc = pager_errcode(pPager);
1228 return rc;
1229 }
1230 if( pPager->state!=SQLITE_WRITELOCK ){
1231 return SQLITE_ERROR;
1232 }
drh8cfbf082001-09-19 13:22:39 +00001233 assert( pPager->journalOpen );
drha7fcb052001-12-14 15:09:55 +00001234 if( pPager->needSync && sqliteOsSync(&pPager->jfd)!=SQLITE_OK ){
drhd9b02572001-04-15 00:37:09 +00001235 goto commit_abort;
drhed7c8552001-04-11 14:29:21 +00001236 }
drha1b351a2001-09-14 16:42:12 +00001237 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
1238 if( pPg->dirty==0 ) continue;
drha7fcb052001-12-14 15:09:55 +00001239 rc = sqliteOsSeek(&pPager->fd, (pPg->pgno-1)*SQLITE_PAGE_SIZE);
drha1b351a2001-09-14 16:42:12 +00001240 if( rc!=SQLITE_OK ) goto commit_abort;
drha7fcb052001-12-14 15:09:55 +00001241 rc = sqliteOsWrite(&pPager->fd, PGHDR_TO_DATA(pPg), SQLITE_PAGE_SIZE);
drha1b351a2001-09-14 16:42:12 +00001242 if( rc!=SQLITE_OK ) goto commit_abort;
drhed7c8552001-04-11 14:29:21 +00001243 }
drh603240c2002-03-05 01:11:12 +00001244 if( !pPager->noSync && sqliteOsSync(&pPager->fd)!=SQLITE_OK ){
1245 goto commit_abort;
1246 }
drhd9b02572001-04-15 00:37:09 +00001247 rc = pager_unwritelock(pPager);
1248 pPager->dbSize = -1;
1249 return rc;
1250
1251 /* Jump here if anything goes wrong during the commit process.
1252 */
1253commit_abort:
1254 rc = sqlitepager_rollback(pPager);
1255 if( rc==SQLITE_OK ){
1256 rc = SQLITE_FULL;
drhed7c8552001-04-11 14:29:21 +00001257 }
drhed7c8552001-04-11 14:29:21 +00001258 return rc;
1259}
1260
1261/*
1262** Rollback all changes. The database falls back to read-only mode.
1263** All in-memory cache pages revert to their original data contents.
1264** The journal is deleted.
drhd9b02572001-04-15 00:37:09 +00001265**
1266** This routine cannot fail unless some other process is not following
1267** the correct locking protocol (SQLITE_PROTOCOL) or unless some other
1268** process is writing trash into the journal file (SQLITE_CORRUPT) or
1269** unless a prior malloc() failed (SQLITE_NOMEM). Appropriate error
1270** codes are returned for all these occasions. Otherwise,
1271** SQLITE_OK is returned.
drhed7c8552001-04-11 14:29:21 +00001272*/
drhd9b02572001-04-15 00:37:09 +00001273int sqlitepager_rollback(Pager *pPager){
drhed7c8552001-04-11 14:29:21 +00001274 int rc;
drhd9b02572001-04-15 00:37:09 +00001275 if( pPager->errMask!=0 && pPager->errMask!=PAGER_ERR_FULL ){
drh4b845d72002-03-05 12:41:19 +00001276 if( pPager->state>=SQLITE_WRITELOCK ){
1277 pager_playback(pPager);
1278 }
drhd9b02572001-04-15 00:37:09 +00001279 return pager_errcode(pPager);
drhed7c8552001-04-11 14:29:21 +00001280 }
drhd9b02572001-04-15 00:37:09 +00001281 if( pPager->state!=SQLITE_WRITELOCK ){
1282 return SQLITE_OK;
1283 }
1284 rc = pager_playback(pPager);
1285 if( rc!=SQLITE_OK ){
1286 rc = SQLITE_CORRUPT;
1287 pPager->errMask |= PAGER_ERR_CORRUPT;
1288 }
1289 pPager->dbSize = -1;
drhed7c8552001-04-11 14:29:21 +00001290 return rc;
drh98808ba2001-10-18 12:34:46 +00001291}
drhd9b02572001-04-15 00:37:09 +00001292
1293/*
drh5e00f6c2001-09-13 13:46:56 +00001294** Return TRUE if the database file is opened read-only. Return FALSE
1295** if the database is (in theory) writable.
1296*/
1297int sqlitepager_isreadonly(Pager *pPager){
drhbe0072d2001-09-13 14:46:09 +00001298 return pPager->readOnly;
drh5e00f6c2001-09-13 13:46:56 +00001299}
1300
1301/*
drhd9b02572001-04-15 00:37:09 +00001302** This routine is used for testing and analysis only.
1303*/
1304int *sqlitepager_stats(Pager *pPager){
1305 static int a[9];
1306 a[0] = pPager->nRef;
1307 a[1] = pPager->nPage;
1308 a[2] = pPager->mxPage;
1309 a[3] = pPager->dbSize;
1310 a[4] = pPager->state;
1311 a[5] = pPager->errMask;
1312 a[6] = pPager->nHit;
1313 a[7] = pPager->nMiss;
1314 a[8] = pPager->nOvfl;
1315 return a;
1316}
drhdd793422001-06-28 01:54:48 +00001317
drhfa86c412002-02-02 15:01:15 +00001318/*
1319** Set the checkpoint.
1320**
1321** This routine should be called with the transaction journal already
1322** open. A new checkpoint journal is created that can be used to rollback
drhaaab5722002-02-19 13:39:21 +00001323** changes of a single SQL command within a larger transaction.
drhfa86c412002-02-02 15:01:15 +00001324*/
1325int sqlitepager_ckpt_begin(Pager *pPager){
1326 int rc;
1327 char zTemp[SQLITE_TEMPNAME_SIZE];
1328 assert( pPager->journalOpen );
1329 assert( !pPager->ckptOpen );
1330 pPager->aInCkpt = sqliteMalloc( pPager->dbSize/8 + 1 );
1331 if( pPager->aInCkpt==0 ){
1332 sqliteOsReadLock(&pPager->fd);
1333 return SQLITE_NOMEM;
1334 }
1335 rc = sqliteOsFileSize(&pPager->jfd, &pPager->ckptJSize);
1336 if( rc ) goto ckpt_begin_failed;
drh663fc632002-02-02 18:49:19 +00001337 pPager->ckptSize = pPager->dbSize;
drhfa86c412002-02-02 15:01:15 +00001338 rc = sqlitepager_opentemp(zTemp, &pPager->cpfd);
1339 if( rc ) goto ckpt_begin_failed;
1340 pPager->ckptOpen = 1;
1341 return SQLITE_OK;
1342
1343ckpt_begin_failed:
1344 if( pPager->aInCkpt ){
1345 sqliteFree(pPager->aInCkpt);
1346 pPager->aInCkpt = 0;
1347 }
1348 return rc;
1349}
1350
1351/*
1352** Commit a checkpoint.
1353*/
1354int sqlitepager_ckpt_commit(Pager *pPager){
drh663fc632002-02-02 18:49:19 +00001355 if( pPager->ckptOpen ){
1356 PgHdr *pPg;
1357 sqliteOsClose(&pPager->cpfd);
1358 pPager->ckptOpen = 0;
1359 sqliteFree( pPager->aInCkpt );
1360 pPager->aInCkpt = 0;
1361 for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
1362 pPg->inCkpt = 0;
1363 }
1364 }
drhfa86c412002-02-02 15:01:15 +00001365 return SQLITE_OK;
1366}
1367
1368/*
1369** Rollback a checkpoint.
1370*/
1371int sqlitepager_ckpt_rollback(Pager *pPager){
1372 int rc;
drh663fc632002-02-02 18:49:19 +00001373 if( pPager->ckptOpen ){
1374 rc = pager_ckpt_playback(pPager);
1375 sqlitepager_ckpt_commit(pPager);
1376 }else{
1377 rc = SQLITE_OK;
1378 }
drhfa86c412002-02-02 15:01:15 +00001379 return rc;
1380}
1381
#if SQLITE_TEST
/*
** Print a listing of all referenced pages and their ref count.
**
** One line is written to standard output for every page whose
** reference count is greater than zero.  The address is printed through
** an unsigned long, so it is not cut down to the width of an int.
*/
void sqlitepager_refdump(Pager *pPager){
  PgHdr *pPg;
  for(pPg=pPager->pAll; pPg; pPg=pPg->pNextAll){
    if( pPg->nRef<=0 ) continue;
    printf("PAGE %3d addr=0x%08lx nRef=%d\n",
       (int)pPg->pgno, (unsigned long)PGHDR_TO_DATA(pPg), pPg->nRef);
  }
}
#endif