Blame - src/os_unix.c - chromium.googlesource.com/chromium/deps/sqlite

blob: 2fff26852d480d3d2a67841905128351473169e1 [file] [log] [blame]

drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1	/*
				2	** 2004 May 22
				3	**
				4	** The author disclaims copyright to this source code. In place of
				5	** a legal notice, here is a blessing:
				6	**
				7	** May you do good and not evil.
				8	** May you find forgiveness for yourself and forgive others.
				9	** May you share freely, never taking more than you give.
				10	**
				11	******************************************************************************
				12	**
				13	** This file contains code that is specific to Unix systems.
				14	*/
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	15	#include "sqliteInt.h"
drh	eb20625	2004-10-01 02:00:31 +0000	[diff] [blame]	16	#include "os.h"
				17	#if OS_UNIX /* This file is used on unix only */
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	18
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	19	/* #define SQLITE_ENABLE_LOCKING_STYLE 0 */
				20
/*
** Request >2GB file support from Posix systems that provide it.  On an
** operating system without large file support (LFS) these definitions
** should be no-ops.
**
** Pass -DSQLITE_DISABLE_LFS on the compiler command line to turn large
** file support off.  That is necessary when compiling on a recent machine
** (ex: RedHat 7.2) code that must also work on an older machine
** (ex: RedHat 6.0).  Built on RedHat 7.2 without this option, LFS is
** enabled, but the RedHat 6.0 kernel has no LFS and the code won't work.
** Hence, for maximum binary portability, omit LFS.
*/
#if !defined(SQLITE_DISABLE_LFS)
# define _LARGE_FILE 1
# if !defined(_FILE_OFFSET_BITS)
#  define _FILE_OFFSET_BITS 64
# endif
# define _LARGEFILE_SOURCE 1
#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	41
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	42	/*
				43	** standard include files.
				44	*/
				45	#include <sys/types.h>
				46	#include <sys/stat.h>
				47	#include <fcntl.h>
				48	#include <unistd.h>
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	49	#include <time.h>
drh	19e2d37	2005-08-29 23:00:03 +0000	[diff] [blame]	50	#include <sys/time.h>
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	51	#include <errno.h>
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	52	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				53	#include <sys/ioctl.h>
				54	#include <sys/param.h>
				55	#include <sys/mount.h>
				56	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	57
				58	/*
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	59	** If we are to be thread-safe, include the pthreads header and define
				60	** the SQLITE_UNIX_THREADS macro.
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	61	*/
drh	2c547df	2007-04-01 18:46:19 +0000	[diff] [blame]	62	#ifndef THREADSAFE
				63	# define THREADSAFE 1
				64	#endif
				65	#if THREADSAFE
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	66	# include <pthread.h>
				67	# define SQLITE_UNIX_THREADS 1
				68	#endif
				69
				70	/*
				71	** Default permissions when creating a new file
				72	*/
				73	#ifndef SQLITE_DEFAULT_FILE_PERMISSIONS
				74	# define SQLITE_DEFAULT_FILE_PERMISSIONS 0644
				75	#endif
				76
				77
				78
				79	/*
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	80	** The unixFile structure is subclass of OsFile specific for the unix
				81	** protability layer.
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	82	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	83	typedef struct unixFile unixFile;
				84	struct unixFile {
				85	IoMethod const pMethod; / Always the first entry */
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	86	struct openCnt pOpen; / Info about all open fd's on this inode */
				87	struct lockInfo pLock; / Info about locks on this inode */
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	88	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				89	void lockingContext; / Locking style specific state */
				90	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	91	int h; /* The file descriptor */
				92	unsigned char locktype; /* The type of lock held on this fd */
				93	unsigned char isOpen; /* True if needs to be closed */
				94	unsigned char fullSync; /* Use F_FULLSYNC if available */
				95	int dirfd; /* File descriptor for the directory */
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	96	i64 offset; /* Seek offset */
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	97	#ifdef SQLITE_UNIX_THREADS
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	98	pthread_t tid; /* The thread that "owns" this OsFile */
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	99	#endif
				100	};
				101
/*
** Provide the ability to override some OS-layer functions during
** testing.  This is used to simulate OS crashes to verify that
** commits are atomic even in the event of an OS crash.
**
** With SQLITE_CRASH_TEST defined, CRASH_TEST_OVERRIDE(X,A,B,C) makes the
** enclosing function return X(A,B,C) whenever sqlite3CrashTestEnable is
** non-zero.  Without SQLITE_CRASH_TEST the macro expands to nothing.
**
** NOTE(review): the pointer levels in the three prototypes below
** (const char*, OsFile**, int*) should be confirmed against the
** definitions of the sqlite3CrashOpen*() routines.
*/
#ifdef SQLITE_CRASH_TEST
  extern int sqlite3CrashTestEnable;
  extern int sqlite3CrashOpenReadWrite(const char*, OsFile**, int*);
  extern int sqlite3CrashOpenExclusive(const char*, OsFile**, int);
  extern int sqlite3CrashOpenReadOnly(const char*, OsFile**, int);
# define CRASH_TEST_OVERRIDE(X,A,B,C) \
    if(sqlite3CrashTestEnable){ return X(A,B,C); }
#else
# define CRASH_TEST_OVERRIDE(X,A,B,C)  /* no-op */
#endif
				117
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	118
				119	/*
drh	198bf39	2006-01-06 21:52:49 +0000	[diff] [blame]	120	** Include code that is common to all os_*.c files
				121	*/
				122	#include "os_common.h"
				123
				124	/*
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	125	** Do not include any of the File I/O interface procedures if the
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	126	** SQLITE_OMIT_DISKIO macro is defined (indicating that the database
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	127	** will be in-memory only)
				128	*/
				129	#ifndef SQLITE_OMIT_DISKIO
				130
				131
				132	/*
				133	** Define various macros that are missing from some systems.
				134	*/
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	135	#ifndef O_LARGEFILE
				136	# define O_LARGEFILE 0
				137	#endif
				138	#ifdef SQLITE_DISABLE_LFS
				139	# undef O_LARGEFILE
				140	# define O_LARGEFILE 0
				141	#endif
				142	#ifndef O_NOFOLLOW
				143	# define O_NOFOLLOW 0
				144	#endif
				145	#ifndef O_BINARY
				146	# define O_BINARY 0
				147	#endif
				148
				149	/*
				150	** The DJGPP compiler environment looks mostly like Unix, but it
				151	** lacks the fcntl() system call. So redefine fcntl() to be something
				152	** that always succeeds. This means that locking does not occur under
danielk1977	26c5d79	2005-11-25 09:01:23 +0000	[diff] [blame]	153	** DJGPP. But it's DOS - what did you expect?
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	154	*/
				155	#ifdef __DJGPP__
				156	# define fcntl(A,B,C) 0
				157	#endif
				158
				159	/*
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	160	** The threadid macro resolves to the thread-id or to 0. Used for
				161	** testing and debugging only.
				162	*/
				163	#ifdef SQLITE_UNIX_THREADS
				164	#define threadid pthread_self()
				165	#else
				166	#define threadid 0
				167	#endif
				168
				169	/*
				170	** Set or check the OsFile.tid field. This field is set when an OsFile
				171	** is first opened. All subsequent uses of the OsFile verify that the
				172	** same thread is operating on the OsFile. Some operating systems do
				173	** not allow locks to be overridden by other threads and that restriction
				174	** means that sqlite3* database handles cannot be moved from one thread
				175	** to another. This logic makes sure a user does not try to do that
				176	** by mistake.
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	177	**
				178	** Version 3.3.1 (2006-01-15): OsFiles can be moved from one thread to
				179	** another as long as we are running on a system that supports threads
				180	** overriding each others locks (which now the most common behavior)
				181	** or if no locks are held. But the OsFile.pLock field needs to be
				182	** recomputed because its key includes the thread-id. See the
				183	** transferOwnership() function below for additional information
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	184	*/
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	185	#if defined(SQLITE_UNIX_THREADS)
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	186	# define SET_THREADID(X) (X)->tid = pthread_self()
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	187	# define CHECK_THREADID(X) (threadsOverrideEachOthersLocks==0 && \
				188	!pthread_equal((X)->tid, pthread_self()))
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	189	#else
				190	# define SET_THREADID(X)
				191	# define CHECK_THREADID(X) 0
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	192	#endif
				193
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	194	/*
				195	** Here is the dirt on POSIX advisory locks: ANSI STD 1003.1 (1996)
				196	** section 6.5.2.2 lines 483 through 490 specify that when a process
				197	** sets or clears a lock, that operation overrides any prior locks set
				198	** by the same process. It does not explicitly say so, but this implies
				199	** that it overrides locks set by the same process using a different
				200	** file descriptor. Consider this test case:
				201	**
				202	** int fd1 = open("./file1", O_RDWR|O_CREAT, 0644);
				203	** int fd2 = open("./file2", O_RDWR|O_CREAT, 0644);
				204	**
				205	** Suppose ./file1 and ./file2 are really the same file (because
				206	** one is a hard or symbolic link to the other) then if you set
				207	** an exclusive lock on fd1, then try to get an exclusive lock
				208	** on fd2, it works. I would have expected the second lock to
				209	** fail since there was already a lock on the file due to fd1.
				210	** But not so. Since both locks came from the same process, the
				211	** second overrides the first, even though they were on different
				212	** file descriptors opened on different file names.
				213	**
				214	** Bummer. If you ask me, this is broken. Badly broken. It means
				215	** that we cannot use POSIX locks to synchronize file access among
				216	** competing threads of the same process. POSIX locks will work fine
				217	** to synchronize access for threads in separate processes, but not
				218	** threads within the same process.
				219	**
				220	** To work around the problem, SQLite has to manage file locks internally
				221	** on its own. Whenever a new database is opened, we have to find the
				222	** specific inode of the database file (the inode is determined by the
				223	** st_dev and st_ino fields of the stat structure that fstat() fills in)
				224	** and check for locks already existing on that inode. When locks are
				225	** created or removed, we have to look at our own internal record of the
				226	** locks to see if another thread has previously set a lock on that same
				227	** inode.
				228	**
				229	** The OsFile structure for POSIX is no longer just an integer file
				230	** descriptor. It is now a structure that holds the integer file
				231	** descriptor and a pointer to a structure that describes the internal
				232	** locks on the corresponding inode. There is one locking structure
				233	** per inode, so if the same inode is opened twice, both OsFile structures
				234	** point to the same locking structure. The locking structure keeps
				235	** a reference count (so we will know when to delete it) and a "cnt"
				236	** field that tells us its internal lock status. cnt==0 means the
				237	** file is unlocked. cnt==-1 means the file has an exclusive lock.
				238	** cnt>0 means there are cnt shared locks on the file.
				239	**
				240	** Any attempt to lock or unlock a file first checks the locking
				241	** structure. The fcntl() system call is only invoked to set a
				242	** POSIX lock if the internal lock structure transitions between
				243	** a locked and an unlocked state.
				244	**
				245	** 2004-Jan-11:
				246	** More recent discoveries about POSIX advisory locks. (The more
				247	** I discover, the more I realize that POSIX advisory locks are
				248	** an abomination.)
				249	**
				250	** If you close a file descriptor that points to a file that has locks,
				251	** all locks on that file that are owned by the current process are
				252	** released. To work around this problem, each OsFile structure contains
				253	** a pointer to an openCnt structure. There is one openCnt structure
				254	** per open inode, which means that multiple OsFiles can point to a single
				255	** openCnt. When an attempt is made to close an OsFile, if there are
				256	** other OsFiles open on the same inode that are holding locks, the call
				257	** to close() the file descriptor is deferred until all of the locks clear.
				258	** The openCnt structure keeps a list of file descriptors that need to
				259	** be closed and that list is walked (and cleared) when the last lock
				260	** clears.
				261	**
				262	** First, under Linux threads, because each thread has a separate
				263	** process ID, lock operations in one thread do not override locks
				264	** to the same file in other threads. Linux threads behave like
				265	** separate processes in this respect. But, if you close a file
				266	** descriptor in linux threads, all locks are cleared, even locks
				267	** on other threads and even though the other threads have different
				268	** process IDs. Linux threads is inconsistent in this respect.
				269	** (I'm beginning to think that linux threads is an abomination too.)
				270	** The consequence of this all is that the hash table for the lockInfo
				271	** structure has to include the process id as part of its key because
				272	** locks in different threads are treated as distinct. But the
				273	** openCnt structure should not include the process id in its
				274	** key because close() clears lock on all threads, not just the current
				275	** thread. Were it not for this goofiness in linux threads, we could
				276	** combine the lockInfo and openCnt structures into a single structure.
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	277	**
				278	** 2004-Jun-28:
				279	** On some versions of linux, threads can override each others locks.
				280	** On others not. Sometimes you can change the behavior on the same
				281	** system by setting the LD_ASSUME_KERNEL environment variable. The
				282	** POSIX standard is silent as to which behavior is correct, as far
				283	** as I can tell, so other versions of unix might show the same
				284	** inconsistency. There is little doubt in my mind that posix
				285	** advisory locks and linux threads are profoundly broken.
				286	**
				287	** To work around the inconsistencies, we have to test at runtime
				288	** whether or not threads can override each others locks. This test
				289	** is run once, the first time any lock is attempted. A static
				290	** variable is set to record the results of this test for future
				291	** use.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	292	*/
				293
				294	/*
				295	** An instance of the following structure serves as the key used
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	296	** to locate a particular lockInfo structure given its inode.
				297	**
				298	** If threads cannot override each others locks, then we set the
				299	** lockKey.tid field to the thread ID. If threads can override
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	300	** each others locks then tid is always set to zero. tid is omitted
				301	** if we compile without threading support.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	302	*/
				303	struct lockKey {
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	304	dev_t dev; /* Device number */
				305	ino_t ino; /* Inode number */
				306	#ifdef SQLITE_UNIX_THREADS
drh	d9cb6ac	2005-10-20 07:28:17 +0000	[diff] [blame]	307	pthread_t tid; /* Thread ID or zero if threads can override each other */
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	308	#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	309	};
				310
				311	/*
				312	** An instance of the following structure is allocated for each open
				313	** inode on each thread with a different process ID. (Threads have
				314	** different process IDs on linux, but not on most other unixes.)
				315	**
				316	** A single inode can have multiple file descriptors, so each OsFile
				317	** structure contains a pointer to an instance of this object and this
				318	** object keeps a count of the number of OsFiles pointing to it.
				319	*/
				320	struct lockInfo {
				321	struct lockKey key; /* The lookup key */
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	322	int cnt; /* Number of SHARED locks held */
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	323	int locktype; /* One of SHARED_LOCK, RESERVED_LOCK etc. */
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	324	int nRef; /* Number of pointers to this structure */
				325	};
				326
				327	/*
				328	** An instance of the following structure serves as the key used
				329	** to locate a particular openCnt structure given its inode. This
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	330	** is the same as the lockKey except that the thread ID is omitted.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	331	*/
				332	struct openKey {
				333	dev_t dev; /* Device number */
				334	ino_t ino; /* Inode number */
				335	};
				336
				337	/*
				338	** An instance of the following structure is allocated for each open
				339	** inode. This structure keeps track of the number of locks on that
				340	** inode. If a close is attempted against an inode that is holding
				341	** locks, the close is deferred until all locks clear by adding the
				342	** file descriptor to be closed to the pending list.
				343	*/
				344	struct openCnt {
				345	struct openKey key; /* The lookup key */
				346	int nRef; /* Number of pointers to this structure */
				347	int nLock; /* Number of outstanding locks */
				348	int nPending; /* Number of pending close() operations */
				349	int aPending; / Malloced space holding fd's awaiting a close() */
				350	};
				351
				352	/*
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	353	** These hash tables map inodes and file descriptors (really, lockKey and
				354	** openKey structures) into lockInfo and openCnt structures. Access to
				355	** these hash tables must be protected by a mutex.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	356	*/
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	357	static Hash lockHash = {SQLITE_HASH_BINARY, 0, 0, 0,
				358	sqlite3ThreadSafeMalloc, sqlite3ThreadSafeFree, 0, 0};
				359	static Hash openHash = {SQLITE_HASH_BINARY, 0, 0, 0,
				360	sqlite3ThreadSafeMalloc, sqlite3ThreadSafeFree, 0, 0};
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	361
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	362	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				363	/*
				364	** The locking styles are associated with the different file locking
				365	** capabilities supported by different file systems.
				366	**
				367	** POSIX locking style fully supports shared and exclusive byte-range locks
				368	** ADP locking only supports exclusive byte-range locks
				369	** FLOCK only supports a single file-global exclusive lock
				370	** DOTLOCK isn't a true locking style, it refers to the use of a special
				371	** file named the same as the database file with a '.lock' extension, this
				372	** can be used on file systems that do not offer any reliable file locking
				373	** NO locking means that no locking will be attempted, this is only used for
				374	** read-only file systems currently
				375	** UNSUPPORTED means that no locking will be attempted, this is only used for
				376	** file systems that are known to be unsupported
				377	*/
				378	typedef enum {
				379	posixLockingStyle = 0, /* standard posix-advisory locks */
				380	afpLockingStyle, /* use afp locks */
				381	flockLockingStyle, /* use flock() */
				382	dotlockLockingStyle, /* use <file>.lock files */
				383	noLockingStyle, /* useful for read-only file system */
				384	unsupportedLockingStyle /* indicates unsupported file system */
				385	} sqlite3LockingStyle;
				386	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
				387
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	388	#ifdef SQLITE_UNIX_THREADS
				389	/*
				390	** This variable records whether or not threads can override each others
				391	** locks.
				392	**
				393	** 0: No. Threads cannot override each others locks.
				394	** 1: Yes. Threads can override each others locks.
				395	** -1: We don't know yet.
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	396	**
drh	5062d3a	2006-01-31 23:03:35 +0000	[diff] [blame]	397	** On some systems, we know at compile-time if threads can override each
				398	** others locks. On those systems, the SQLITE_THREAD_OVERRIDE_LOCK macro
				399	** will be set appropriately. On other systems, we have to check at
				400	** runtime. On these latter systems, SQLTIE_THREAD_OVERRIDE_LOCK is
				401	** undefined.
				402	**
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	403	** This variable normally has file scope only. But during testing, we make
				404	** it a global so that the test code can change its value in order to verify
				405	** that the right stuff happens in either case.
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	406	*/
drh	5062d3a	2006-01-31 23:03:35 +0000	[diff] [blame]	407	#ifndef SQLITE_THREAD_OVERRIDE_LOCK
				408	# define SQLITE_THREAD_OVERRIDE_LOCK -1
				409	#endif
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	410	#ifdef SQLITE_TEST
drh	5062d3a	2006-01-31 23:03:35 +0000	[diff] [blame]	411	int threadsOverrideEachOthersLocks = SQLITE_THREAD_OVERRIDE_LOCK;
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	412	#else
drh	5062d3a	2006-01-31 23:03:35 +0000	[diff] [blame]	413	static int threadsOverrideEachOthersLocks = SQLITE_THREAD_OVERRIDE_LOCK;
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	414	#endif
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	415
				416	/*
				417	** This structure holds information passed into individual test
				418	** threads by the testThreadLockingBehavior() routine.
				419	*/
				420	struct threadTestData {
				421	int fd; /* File to be locked */
				422	struct flock lock; /* The locking operation */
				423	int result; /* Result of the locking operation */
				424	};
				425
#ifdef SQLITE_LOCK_TRACE
/*
** Return a printable name for the l_type field of a struct flock.
** Any value other than F_RDLCK, F_WRLCK or F_UNLCK trips an assert();
** when asserts are compiled out a placeholder string is returned so that
** the caller never formats an uninitialized pointer.
*/
static const char *lockTraceTypeName(int eType){
  if( eType==F_RDLCK ) return "RDLCK";
  if( eType==F_WRLCK ) return "WRLCK";
  if( eType==F_UNLCK ) return "UNLCK";
  assert( 0 );
  return "???";
}

/*
** Print out information about all locking operations.
**
** This routine is used for troubleshooting locks on multithreaded
** platforms.  Enable by compiling with the -DSQLITE_LOCK_TRACE
** command-line option on the compiler.  This code is normally
** turned off.
**
** The routine performs fcntl(fd, op, p), prints a one-line description
** of the request and its result, and returns the fcntl() result.  When
** an F_SETLK request for a read or write lock fails, it also issues an
** F_GETLK query and prints the lock that query reports.  The errno
** value left by the traced fcntl() call is restored before returning.
**
** Operations other than F_GETLK and F_SETLK are passed straight through
** with a shorter trace line.
*/
static int lockTrace(int fd, int op, struct flock *p){
  const char *zOpName;
  const char *zType;
  int s;
  int savedErrno;
  if( op==F_GETLK ){
    zOpName = "GETLK";
  }else if( op==F_SETLK ){
    zOpName = "SETLK";
  }else{
    s = fcntl(fd, op, p);
    sqlite3DebugPrintf("fcntl unknown %d %d %d\n", fd, op, s);
    return s;
  }
  zType = lockTraceTypeName(p->l_type);
  assert( p->l_whence==SEEK_SET );
  s = fcntl(fd, op, p);
  savedErrno = errno;   /* The tracing calls below may clobber errno */
  sqlite3DebugPrintf("fcntl %d %d %s %s %d %d %d %d\n",
     threadid, fd, zOpName, zType, (int)p->l_start, (int)p->l_len,
     (int)p->l_pid, s);
  if( s==(-1) && op==F_SETLK && (p->l_type==F_RDLCK || p->l_type==F_WRLCK) ){
    struct flock l2;
    l2 = *p;
    fcntl(fd, F_GETLK, &l2);
    zType = lockTraceTypeName(l2.l_type);
    sqlite3DebugPrintf("fcntl-failure-reason: %s %d %d %d\n",
       zType, (int)l2.l_start, (int)l2.l_len, (int)l2.l_pid);
  }
  errno = savedErrno;
  return s;
}
/* From here on, every fcntl() call in this file goes through lockTrace() */
#define fcntl lockTrace
#endif /* SQLITE_LOCK_TRACE */
				484
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	485	/*
				486	** The testThreadLockingBehavior() routine launches two separate
				487	** threads on this routine. This routine attempts to lock a file
				488	** descriptor then returns. The success or failure of that attempt
				489	** allows the testThreadLockingBehavior() procedure to determine
				490	** whether or not threads can override each others locks.
				491	*/
				492	static void threadLockingTest(void pArg){
				493	struct threadTestData pData = (struct threadTestData)pArg;
				494	pData->result = fcntl(pData->fd, F_SETLK, &pData->lock);
				495	return pArg;
				496	}
				497
				498	/*
				499	** This procedure attempts to determine whether or not threads
				500	** can override each others locks then sets the
				501	** threadsOverrideEachOthersLocks variable appropriately.
				502	*/
danielk1977	4d5238f	2006-01-27 06:32:00 +0000	[diff] [blame]	503	static void testThreadLockingBehavior(int fd_orig){
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	504	int fd;
				505	struct threadTestData d[2];
				506	pthread_t t[2];
				507
				508	fd = dup(fd_orig);
				509	if( fd<0 ) return;
				510	memset(d, 0, sizeof(d));
				511	d[0].fd = fd;
				512	d[0].lock.l_type = F_RDLCK;
				513	d[0].lock.l_len = 1;
				514	d[0].lock.l_start = 0;
				515	d[0].lock.l_whence = SEEK_SET;
				516	d[1] = d[0];
				517	d[1].lock.l_type = F_WRLCK;
				518	pthread_create(&t[0], 0, threadLockingTest, &d[0]);
				519	pthread_create(&t[1], 0, threadLockingTest, &d[1]);
				520	pthread_join(t[0], 0);
				521	pthread_join(t[1], 0);
				522	close(fd);
				523	threadsOverrideEachOthersLocks = d[0].result==0 && d[1].result==0;
				524	}
				525	#endif /* SQLITE_UNIX_THREADS */
				526
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	527	/*
				528	** Release a lockInfo structure previously allocated by findLockInfo().
				529	*/
				530	static void releaseLockInfo(struct lockInfo *pLock){
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	531	assert( sqlite3OsInMutex(1) );
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	532	if (pLock == NULL)
				533	return;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	534	pLock->nRef--;
				535	if( pLock->nRef==0 ){
				536	sqlite3HashInsert(&lockHash, &pLock->key, sizeof(pLock->key), 0);
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	537	sqlite3ThreadSafeFree(pLock);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	538	}
				539	}
				540
				541	/*
				542	** Release a openCnt structure previously allocated by findLockInfo().
				543	*/
				544	static void releaseOpenCnt(struct openCnt *pOpen){
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	545	assert( sqlite3OsInMutex(1) );
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	546	if (pOpen == NULL)
				547	return;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	548	pOpen->nRef--;
				549	if( pOpen->nRef==0 ){
				550	sqlite3HashInsert(&openHash, &pOpen->key, sizeof(pOpen->key), 0);
drh	64b1bea	2006-01-15 02:30:57 +0000	[diff] [blame]	551	free(pOpen->aPending);
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	552	sqlite3ThreadSafeFree(pOpen);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	553	}
				554	}
				555
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	556	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				557	/*
				558	** Tests a byte-range locking query to see if byte range locks are
				559	** supported, if not we fall back to dotlockLockingStyle.
				560	*/
				561	static sqlite3LockingStyle sqlite3TestLockingStyle(const char *filePath,
				562	int fd) {
				563	/* test byte-range lock using fcntl */
				564	struct flock lockInfo;
				565
				566	lockInfo.l_len = 1;
				567	lockInfo.l_start = 0;
				568	lockInfo.l_whence = SEEK_SET;
				569	lockInfo.l_type = F_RDLCK;
				570
aswift	ae0943b	2007-01-31 23:37:07 +0000	[diff] [blame]	571	if (fcntl(fd, F_GETLK, &lockInfo) != -1) {
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	572	return posixLockingStyle;
				573	}
				574
				575	/* testing for flock can give false positives. So if if the above test
				576	** fails, then we fall back to using dot-lock style locking.
				577	*/
				578	return dotlockLockingStyle;
				579	}
				580
				581	/*
				582	** Examines the f_fstypename entry in the statfs structure as returned by
				583	** stat() for the file system hosting the database file, assigns the
				584	** appropriate locking style based on it's value. These values and
				585	** assignments are based on Darwin/OSX behavior and have not been tested on
				586	** other systems.
				587	*/
				588	static sqlite3LockingStyle sqlite3DetectLockingStyle(const char *filePath,
				589	int fd) {
				590
				591	#ifdef SQLITE_FIXED_LOCKING_STYLE
				592	return (sqlite3LockingStyle)SQLITE_FIXED_LOCKING_STYLE;
				593	#else
				594	struct statfs fsInfo;
				595
				596	if (statfs(filePath, &fsInfo) == -1)
				597	return sqlite3TestLockingStyle(filePath, fd);
				598
				599	if (fsInfo.f_flags & MNT_RDONLY)
				600	return noLockingStyle;
				601
				602	if( (!strcmp(fsInfo.f_fstypename, "hfs")) \|\|
				603	(!strcmp(fsInfo.f_fstypename, "ufs")) )
				604	return posixLockingStyle;
				605
				606	if(!strcmp(fsInfo.f_fstypename, "afpfs"))
				607	return afpLockingStyle;
				608
				609	if(!strcmp(fsInfo.f_fstypename, "nfs"))
				610	return sqlite3TestLockingStyle(filePath, fd);
				611
				612	if(!strcmp(fsInfo.f_fstypename, "smbfs"))
				613	return flockLockingStyle;
				614
				615	if(!strcmp(fsInfo.f_fstypename, "msdos"))
				616	return dotlockLockingStyle;
				617
				618	if(!strcmp(fsInfo.f_fstypename, "webdav"))
				619	return unsupportedLockingStyle;
				620
				621	return sqlite3TestLockingStyle(filePath, fd);
				622	#endif // SQLITE_FIXED_LOCKING_STYLE
				623	}
				624
				625	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
				626
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	627	/*
				628	** Given a file descriptor, locate lockInfo and openCnt structures that
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	629	** describes that file descriptor. Create new ones if necessary. The
				630	** return values might be uninitialized if an error occurs.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	631	**
				632	** Return the number of errors.
				633	*/
drh	38f8271	2004-06-18 17:10:16 +0000	[diff] [blame]	634	static int findLockInfo(
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	635	int fd, /* The file descriptor used in the key */
				636	struct lockInfo *ppLock, / Return the lockInfo structure here */
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	637	struct openCnt *ppOpen / Return the openCnt structure here */
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	638	){
				639	int rc;
				640	struct lockKey key1;
				641	struct openKey key2;
				642	struct stat statbuf;
				643	struct lockInfo *pLock;
				644	struct openCnt *pOpen;
				645	rc = fstat(fd, &statbuf);
				646	if( rc!=0 ) return 1;
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	647
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	648	assert( sqlite3OsInMutex(1) );
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	649	memset(&key1, 0, sizeof(key1));
				650	key1.dev = statbuf.st_dev;
				651	key1.ino = statbuf.st_ino;
drh	5fdae77	2004-06-29 03:29:00 +0000	[diff] [blame]	652	#ifdef SQLITE_UNIX_THREADS
				653	if( threadsOverrideEachOthersLocks<0 ){
				654	testThreadLockingBehavior(fd);
				655	}
				656	key1.tid = threadsOverrideEachOthersLocks ? 0 : pthread_self();
				657	#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	658	memset(&key2, 0, sizeof(key2));
				659	key2.dev = statbuf.st_dev;
				660	key2.ino = statbuf.st_ino;
				661	pLock = (struct lockInfo*)sqlite3HashFind(&lockHash, &key1, sizeof(key1));
				662	if( pLock==0 ){
				663	struct lockInfo *pOld;
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	664	pLock = sqlite3ThreadSafeMalloc( sizeof(*pLock) );
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	665	if( pLock==0 ){
				666	rc = 1;
				667	goto exit_findlockinfo;
				668	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	669	pLock->key = key1;
				670	pLock->nRef = 1;
				671	pLock->cnt = 0;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	672	pLock->locktype = 0;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	673	pOld = sqlite3HashInsert(&lockHash, &pLock->key, sizeof(key1), pLock);
				674	if( pOld!=0 ){
				675	assert( pOld==pLock );
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	676	sqlite3ThreadSafeFree(pLock);
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	677	rc = 1;
				678	goto exit_findlockinfo;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	679	}
				680	}else{
				681	pLock->nRef++;
				682	}
				683	*ppLock = pLock;
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	684	if( ppOpen!=0 ){
				685	pOpen = (struct openCnt*)sqlite3HashFind(&openHash, &key2, sizeof(key2));
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	686	if( pOpen==0 ){
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	687	struct openCnt *pOld;
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	688	pOpen = sqlite3ThreadSafeMalloc( sizeof(*pOpen) );
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	689	if( pOpen==0 ){
				690	releaseLockInfo(pLock);
				691	rc = 1;
				692	goto exit_findlockinfo;
				693	}
				694	pOpen->key = key2;
				695	pOpen->nRef = 1;
				696	pOpen->nLock = 0;
				697	pOpen->nPending = 0;
				698	pOpen->aPending = 0;
				699	pOld = sqlite3HashInsert(&openHash, &pOpen->key, sizeof(key2), pOpen);
				700	if( pOld!=0 ){
				701	assert( pOld==pOpen );
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	702	sqlite3ThreadSafeFree(pOpen);
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	703	releaseLockInfo(pLock);
				704	rc = 1;
				705	goto exit_findlockinfo;
				706	}
				707	}else{
				708	pOpen->nRef++;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	709	}
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	710	*ppOpen = pOpen;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	711	}
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	712
				713	exit_findlockinfo:
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	714	return rc;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	715	}
				716
#ifdef SQLITE_DEBUG
/*
** Helper function for printing out trace information from debugging
** binaries.  Map an integer lock-type onto its string representation.
** Any value that is not one of the five known lock types yields "ERROR".
*/
static const char *locktypeName(int locktype){
  const char *zName = "ERROR";
  switch( locktype ){
    case NO_LOCK:         zName = "NONE";       break;
    case SHARED_LOCK:     zName = "SHARED";     break;
    case RESERVED_LOCK:   zName = "RESERVED";   break;
    case PENDING_LOCK:    zName = "PENDING";    break;
    case EXCLUSIVE_LOCK:  zName = "EXCLUSIVE";  break;
    default:              break;
  }
  return zName;
}
#endif
				734
/*
** If we are currently in a different thread than the thread that the
** unixFile argument belongs to, then transfer ownership of the unixFile
** over to the current thread.
**
** A unixFile is only owned by a thread on systems where one thread is
** unable to override locks created by a different thread.  RedHat9 is
** an example of such a system.
**
** Ownership transfer is only allowed if the unixFile is currently unlocked.
** If the unixFile is locked and the ownership is wrong, then return
** SQLITE_MISUSE.  SQLITE_OK is returned if everything works.  If the
** lockInfo structure has to be looked up again for the new thread and
** that lookup fails, the non-zero result of findLockInfo() is returned.
*/
#ifdef SQLITE_UNIX_THREADS
static int transferOwnership(unixFile *pFile){
  int rc;
  pthread_t hSelf;
  if( threadsOverrideEachOthersLocks ){
    /* Ownership transfers not needed on this system */
    return SQLITE_OK;
  }
  hSelf = pthread_self();
  if( pthread_equal(pFile->tid, hSelf) ){
    /* We are still in the same thread */
    OSTRACE1("No-transfer, same thread\n");
    return SQLITE_OK;
  }
  if( pFile->locktype!=NO_LOCK ){
    /* We cannot change ownership while we are holding a lock! */
    return SQLITE_MISUSE;
  }
  OSTRACE4("Transfer ownership of %d from %d to %d\n",
            pFile->h, pFile->tid, hSelf);
  pFile->tid = hSelf;
  if( pFile->pLock==NULL ){
    return SQLITE_OK;
  }
  releaseLockInfo(pFile->pLock);
  rc = findLockInfo(pFile->h, &pFile->pLock, 0);
  if( rc==0 ){
    /* Only trace on success.  On failure pFile->pLock may still point at
    ** the structure released above, so it must not be dereferenced. */
    OSTRACE5("LOCK %d is now %s(%s,%d)\n", pFile->h,
           locktypeName(pFile->locktype),
           locktypeName(pFile->pLock->locktype), pFile->pLock->cnt);
  }
  return rc;
}
#else
  /* On single-threaded builds, ownership transfer is a no-op */
# define transferOwnership(X) SQLITE_OK
#endif
				784
				785	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	786	** Delete the named file
				787	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	788	int sqlite3UnixDelete(const char *zFilename){
danielk1977	979f38e	2007-03-27 16:19:51 +0000	[diff] [blame]	789	SimulateIOError(return SQLITE_IOERR_DELETE);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	790	unlink(zFilename);
				791	return SQLITE_OK;
				792	}
				793
				794	/*
				795	** Return TRUE if the named file exists.
				796	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	797	int sqlite3UnixFileExists(const char *zFilename){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	798	return access(zFilename, 0)==0;
				799	}
				800
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	801	/* Forward declaration */
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	802	static int allocateUnixFile(
				803	int h, /* File descriptor of the open file */
				804	OsFile *pId, / Write the real file descriptor here */
				805	const char zFilename, / Name of the file being opened */
				806	int delFlag /* If true, make sure the file deletes on close */
				807	);
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	808
				809	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	810	** Attempt to open a file for both reading and writing. If that
				811	** fails, try opening it read-only. If the file does not exist,
				812	** try to create it.
				813	**
				814	** On success, a handle for the open file is written to *id
				815	** and *pReadonly is set to 0 if the file was opened for reading and
				816	** writing or 1 if the file was opened read-only. The function returns
				817	** SQLITE_OK.
				818	**
				819	** On failure, the function returns SQLITE_CANTOPEN and leaves
				820	** id and pReadonly unchanged.
				821	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	822	int sqlite3UnixOpenReadWrite(
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	823	const char *zFilename,
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	824	OsFile **pId,
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	825	int *pReadonly
				826	){
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	827	int h;
				828
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	829	CRASH_TEST_OVERRIDE(sqlite3CrashOpenReadWrite, zFilename, pId, pReadonly);
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	830	assert( 0==*pId );
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	831	h = open(zFilename, O_RDWR\|O_CREAT\|O_LARGEFILE\|O_BINARY,
				832	SQLITE_DEFAULT_FILE_PERMISSIONS);
				833	if( h<0 ){
drh	6458e39	2004-07-20 01:14:13 +0000	[diff] [blame]	834	#ifdef EISDIR
				835	if( errno==EISDIR ){
				836	return SQLITE_CANTOPEN;
				837	}
				838	#endif
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	839	h = open(zFilename, O_RDONLY\|O_LARGEFILE\|O_BINARY);
				840	if( h<0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	841	return SQLITE_CANTOPEN;
				842	}
				843	*pReadonly = 1;
				844	}else{
				845	*pReadonly = 0;
				846	}
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	847	return allocateUnixFile(h, pId, zFilename, 0);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	848	}
				849
				850
				851	/*
				852	** Attempt to open a new file for exclusive access by this process.
				853	** The file will be opened for both reading and writing. To avoid
				854	** a potential security problem, we do not allow the file to have
				855	** previously existed. Nor do we allow the file to be a symbolic
				856	** link.
				857	**
				858	** If delFlag is true, then make arrangements to automatically delete
				859	** the file when it is closed.
				860	**
				861	** On success, write the file handle into *id and return SQLITE_OK.
				862	**
				863	** On failure, return SQLITE_CANTOPEN.
				864	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	865	int sqlite3UnixOpenExclusive(const char zFilename, OsFile *pId, int delFlag){
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	866	int h;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	867
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	868	CRASH_TEST_OVERRIDE(sqlite3CrashOpenExclusive, zFilename, pId, delFlag);
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	869	assert( 0==*pId );
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	870	h = open(zFilename,
drh	d645967	2005-08-13 17:17:01 +0000	[diff] [blame]	871	O_RDWR\|O_CREAT\|O_EXCL\|O_NOFOLLOW\|O_LARGEFILE\|O_BINARY,
drh	3f56e6e	2007-03-15 01:16:47 +0000	[diff] [blame]	872	delFlag ? 0600 : SQLITE_DEFAULT_FILE_PERMISSIONS);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	873	if( h<0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	874	return SQLITE_CANTOPEN;
				875	}
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	876	return allocateUnixFile(h, pId, zFilename, delFlag);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	877	}
				878
				879	/*
				880	** Attempt to open a new file for read-only access.
				881	**
				882	** On success, write the file handle into *id and return SQLITE_OK.
				883	**
				884	** On failure, return SQLITE_CANTOPEN.
				885	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	886	int sqlite3UnixOpenReadOnly(const char zFilename, OsFile *pId){
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	887	int h;
				888
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	889	CRASH_TEST_OVERRIDE(sqlite3CrashOpenReadOnly, zFilename, pId, 0);
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	890	assert( 0==*pId );
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	891	h = open(zFilename, O_RDONLY\|O_LARGEFILE\|O_BINARY);
				892	if( h<0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	893	return SQLITE_CANTOPEN;
				894	}
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	895	return allocateUnixFile(h, pId, zFilename, 0);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	896	}
				897
				898	/*
				899	** Attempt to open a file descriptor for the directory that contains a
				900	** file. This file descriptor can be used to fsync() the directory
				901	** in order to make sure the creation of a new file is actually written
				902	** to disk.
				903	**
				904	** This routine is only meaningful for Unix. It is a no-op under
				905	** windows since windows does not support hard links.
				906	**
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	907	** If FULL_FSYNC is enabled, this function is not longer useful,
				908	** a FULL_FSYNC sync applies to all pending disk operations.
				909	**
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	910	** On success, a handle for a previously open file at *id is
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	911	** updated with the new directory file descriptor and SQLITE_OK is
				912	** returned.
				913	**
				914	** On failure, the function returns SQLITE_CANTOPEN and leaves
				915	** *id unchanged.
				916	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	917	static int unixOpenDirectory(
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	918	OsFile *id,
				919	const char *zDirname
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	920	){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	921	unixFile pFile = (unixFile)id;
				922	if( pFile==0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	923	/* Do not open the directory if the corresponding file is not already
				924	** open. */
				925	return SQLITE_CANTOPEN;
				926	}
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	927	SET_THREADID(pFile);
				928	assert( pFile->dirfd<0 );
				929	pFile->dirfd = open(zDirname, O_RDONLY\|O_BINARY, 0);
				930	if( pFile->dirfd<0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	931	return SQLITE_CANTOPEN;
				932	}
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	933	OSTRACE3("OPENDIR %-3d %s\n", pFile->dirfd, zDirname);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	934	return SQLITE_OK;
				935	}
				936
				937	/*
				938	** Create a temporary file name in zBuf. zBuf must be big enough to
				939	** hold at least SQLITE_TEMPNAME_SIZE characters.
				940	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	941	int sqlite3UnixTempFileName(char *zBuf){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	942	static const char *azDirs[] = {
drh	ab3f9fe	2004-08-14 17:10:10 +0000	[diff] [blame]	943	0,
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	944	"/var/tmp",
				945	"/usr/tmp",
				946	"/tmp",
				947	".",
				948	};
drh	5719628	2004-10-06 15:41:16 +0000	[diff] [blame]	949	static const unsigned char zChars[] =
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	950	"abcdefghijklmnopqrstuvwxyz"
				951	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
				952	"0123456789";
				953	int i, j;
				954	struct stat buf;
				955	const char *zDir = ".";
drh	effd02b	2004-08-29 23:42:13 +0000	[diff] [blame]	956	azDirs[0] = sqlite3_temp_directory;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	957	for(i=0; i<sizeof(azDirs)/sizeof(azDirs[0]); i++){
drh	ab3f9fe	2004-08-14 17:10:10 +0000	[diff] [blame]	958	if( azDirs[i]==0 ) continue;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	959	if( stat(azDirs[i], &buf) ) continue;
				960	if( !S_ISDIR(buf.st_mode) ) continue;
				961	if( access(azDirs[i], 07) ) continue;
				962	zDir = azDirs[i];
				963	break;
				964	}
				965	do{
				966	sprintf(zBuf, "%s/"TEMP_FILE_PREFIX, zDir);
				967	j = strlen(zBuf);
				968	sqlite3Randomness(15, &zBuf[j]);
				969	for(i=0; i<15; i++, j++){
				970	zBuf[j] = (char)zChars[ ((unsigned char)zBuf[j])%(sizeof(zChars)-1) ];
				971	}
				972	zBuf[j] = 0;
				973	}while( access(zBuf,0)==0 );
				974	return SQLITE_OK;
				975	}
				976
				977	/*
tpoindex	9a09a3c	2004-12-20 19:01:32 +0000	[diff] [blame]	978	** Check that a given pathname is a directory and is writable
				979	**
				980	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	981	int sqlite3UnixIsDirWritable(char *zBuf){
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	982	#ifndef SQLITE_OMIT_PAGER_PRAGMAS
tpoindex	9a09a3c	2004-12-20 19:01:32 +0000	[diff] [blame]	983	struct stat buf;
				984	if( zBuf==0 ) return 0;
drh	268283b	2005-01-08 15:44:25 +0000	[diff] [blame]	985	if( zBuf[0]==0 ) return 0;
tpoindex	9a09a3c	2004-12-20 19:01:32 +0000	[diff] [blame]	986	if( stat(zBuf, &buf) ) return 0;
				987	if( !S_ISDIR(buf.st_mode) ) return 0;
				988	if( access(zBuf, 07) ) return 0;
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	989	#endif /* SQLITE_OMIT_PAGER_PRAGMAS */
tpoindex	9a09a3c	2004-12-20 19:01:32 +0000	[diff] [blame]	990	return 1;
				991	}
				992
				993	/*
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	994	** Seek to the offset in id->offset then read cnt bytes into pBuf.
				995	** Return the number of bytes actually read. Update the offset.
				996	*/
				997	static int seekAndRead(unixFile id, void pBuf, int cnt){
				998	int got;
drh	8ebf670	2007-02-06 11:11:08 +0000	[diff] [blame]	999	i64 newOffset;
drh	15d00c4	2007-02-27 02:01:14 +0000	[diff] [blame]	1000	TIMER_START;
drh	8350a21	2007-03-22 15:22:06 +0000	[diff] [blame]	1001	#if defined(USE_PREAD)
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1002	got = pread(id->h, pBuf, cnt, id->offset);
drh	8350a21	2007-03-22 15:22:06 +0000	[diff] [blame]	1003	#elif defined(USE_PREAD64)
				1004	got = pread64(id->h, pBuf, cnt, id->offset);
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1005	#else
drh	8ebf670	2007-02-06 11:11:08 +0000	[diff] [blame]	1006	newOffset = lseek(id->h, id->offset, SEEK_SET);
				1007	if( newOffset!=id->offset ){
				1008	return -1;
				1009	}
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1010	got = read(id->h, pBuf, cnt);
				1011	#endif
drh	15d00c4	2007-02-27 02:01:14 +0000	[diff] [blame]	1012	TIMER_END;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1013	OSTRACE5("READ %-3d %5d %7lld %d\n", id->h, got, id->offset, TIMER_ELAPSED);
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1014	if( got>0 ){
				1015	id->offset += got;
				1016	}
				1017	return got;
				1018	}
				1019
				1020	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1021	** Read data from a file into a buffer. Return SQLITE_OK if all
				1022	** bytes were read successfully and SQLITE_IOERR if anything goes
				1023	** wrong.
				1024	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1025	static int unixRead(OsFile id, void pBuf, int amt){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1026	int got;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1027	assert( id );
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1028	got = seekAndRead((unixFile*)id, pBuf, amt);
drh	551b773	2006-11-06 21:20:25 +0000	[diff] [blame]	1029	SimulateIOError( got = -1 );
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1030	if( got==amt ){
				1031	return SQLITE_OK;
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1032	}else if( got<0 ){
				1033	return SQLITE_IOERR_READ;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1034	}else{
drh	bafda09	2007-01-03 23:36:22 +0000	[diff] [blame]	1035	memset(&((char*)pBuf)[got], 0, amt-got);
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1036	return SQLITE_IOERR_SHORT_READ;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1037	}
				1038	}
				1039
				1040	/*
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1041	** Seek to the offset in id->offset then read cnt bytes into pBuf.
				1042	** Return the number of bytes actually read. Update the offset.
				1043	*/
				1044	static int seekAndWrite(unixFile id, const void pBuf, int cnt){
				1045	int got;
drh	8ebf670	2007-02-06 11:11:08 +0000	[diff] [blame]	1046	i64 newOffset;
drh	15d00c4	2007-02-27 02:01:14 +0000	[diff] [blame]	1047	TIMER_START;
drh	8350a21	2007-03-22 15:22:06 +0000	[diff] [blame]	1048	#if defined(USE_PREAD)
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1049	got = pwrite(id->h, pBuf, cnt, id->offset);
drh	8350a21	2007-03-22 15:22:06 +0000	[diff] [blame]	1050	#elif defined(USE_PREAD64)
				1051	got = pwrite64(id->h, pBuf, cnt, id->offset);
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1052	#else
drh	8ebf670	2007-02-06 11:11:08 +0000	[diff] [blame]	1053	newOffset = lseek(id->h, id->offset, SEEK_SET);
				1054	if( newOffset!=id->offset ){
				1055	return -1;
				1056	}
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1057	got = write(id->h, pBuf, cnt);
				1058	#endif
drh	15d00c4	2007-02-27 02:01:14 +0000	[diff] [blame]	1059	TIMER_END;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1060	OSTRACE5("WRITE %-3d %5d %7lld %d\n", id->h, got, id->offset, TIMER_ELAPSED);
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1061	if( got>0 ){
				1062	id->offset += got;
				1063	}
				1064	return got;
				1065	}
				1066
				1067
				1068	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1069	** Write data from a buffer into a file. Return SQLITE_OK on success
				1070	** or some other error code on failure.
				1071	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1072	static int unixWrite(OsFile id, const void pBuf, int amt){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1073	int wrote = 0;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1074	assert( id );
drh	4c7f941	2005-02-03 00:29:47 +0000	[diff] [blame]	1075	assert( amt>0 );
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1076	while( amt>0 && (wrote = seekAndWrite((unixFile*)id, pBuf, amt))>0 ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1077	amt -= wrote;
				1078	pBuf = &((char*)pBuf)[wrote];
				1079	}
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1080	SimulateIOError(( wrote=(-1), amt=1 ));
				1081	SimulateDiskfullError(( wrote=0, amt=1 ));
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1082	if( amt>0 ){
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1083	if( wrote<0 ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1084	return SQLITE_IOERR_WRITE;
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1085	}else{
				1086	return SQLITE_FULL;
				1087	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1088	}
				1089	return SQLITE_OK;
				1090	}
				1091
				1092	/*
				1093	** Move the read/write pointer in a file.
				1094	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1095	static int unixSeek(OsFile *id, i64 offset){
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1096	assert( id );
drh	b4746b9	2005-09-09 01:32:06 +0000	[diff] [blame]	1097	#ifdef SQLITE_TEST
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1098	if( offset ) SimulateDiskfullError(return SQLITE_FULL);
drh	b4746b9	2005-09-09 01:32:06 +0000	[diff] [blame]	1099	#endif
drh	b912b28	2006-03-23 22:42:20 +0000	[diff] [blame]	1100	((unixFile*)id)->offset = offset;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1101	return SQLITE_OK;
				1102	}
				1103
drh	b851b2c	2005-03-10 14:11:12 +0000	[diff] [blame]	1104	#ifdef SQLITE_TEST
				1105	/*
				1106	** Count the number of fullsyncs and normal syncs. This is used to test
				1107	** that syncs and fullsyncs are occurring at the right times.
				1108	*/
				1109	int sqlite3_sync_count = 0;
				1110	int sqlite3_fullsync_count = 0;
				1111	#endif
				1112
drh	f2f2391	2005-10-05 10:29:36 +0000	[diff] [blame]	1113	/*
				1114	** Use the fdatasync() API only if the HAVE_FDATASYNC macro is defined.
				1115	** Otherwise use fsync() in its place.
				1116	*/
				1117	#ifndef HAVE_FDATASYNC
				1118	# define fdatasync fsync
				1119	#endif
				1120
drh	ac530b1	2006-02-11 01:25:50 +0000	[diff] [blame]	1121	/*
				1122	** Define HAVE_FULLFSYNC to 0 or 1 depending on whether or not
				1123	** the F_FULLFSYNC macro is defined. F_FULLFSYNC is currently
				1124	** only available on Mac OS X. But that could change.
				1125	*/
				1126	#ifdef F_FULLFSYNC
				1127	# define HAVE_FULLFSYNC 1
				1128	#else
				1129	# define HAVE_FULLFSYNC 0
				1130	#endif
				1131
drh	b851b2c	2005-03-10 14:11:12 +0000	[diff] [blame]	1132
/*
** The fsync() system call does not work as advertised on many
** unix systems.  The following procedure is an attempt to make
** it work better.
**
** The SQLITE_NO_SYNC macro disables all fsync()s.  This is useful
** for testing when we want to run through the test suite quickly.
** You are strongly advised not to deploy with SQLITE_NO_SYNC
** enabled, however, since with SQLITE_NO_SYNC enabled, an OS crash
** or power failure will likely corrupt the database file.
**
** Returns zero on success and non-zero if the sync call fails.
*/
static int full_fsync(int fd, int fullSync, int dataOnly){
  int rc;

  /* Record the number of times that we do a normal fsync() and
  ** FULLSYNC.  This is used during testing to verify that this procedure
  ** gets called with the correct arguments.
  */
#ifdef SQLITE_TEST
  sqlite3_sync_count++;
  if( fullSync ){
    sqlite3_fullsync_count++;
  }
#endif

#ifdef SQLITE_NO_SYNC
  /* Compiled with SQLITE_NO_SYNC: syncing is a no-op. */
  rc = SQLITE_OK;
#elif HAVE_FULLFSYNC
  /* Try F_FULLFSYNC when requested.  If it was not requested, or if it
  ** failed, fall back to a plain fsync().  It shouldn't be possible for
  ** fullfsync to fail on the local file system (on OSX), so failure
  ** indicates that FULLFSYNC isn't supported for this file system.  It
  ** would be better to detect fullfsync support once and avoid the
  ** fcntl call every time sync is called.
  */
  rc = fullSync ? fcntl(fd, F_FULLFSYNC, 0) : 1;
  if( rc ){
    rc = fsync(fd);
  }
#else
  rc = dataOnly ? fdatasync(fd) : fsync(fd);
#endif

  return rc;
}
				1190
				1191	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1192	** Make sure all writes to a particular file are committed to disk.
				1193	**
drh	eb796a7	2005-09-08 12:38:41 +0000	[diff] [blame]	1194	** If dataOnly==0 then both the file itself and its metadata (file
				1195	** size, access time, etc) are synced. If dataOnly!=0 then only the
				1196	** file data is synced.
				1197	**
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1198	** Under Unix, also make sure that the directory entry for the file
				1199	** has been created by fsync-ing the directory that contains the file.
				1200	** If we do not do this and we encounter a power failure, the directory
				1201	** entry for the journal might not exist after we reboot. The next
				1202	** SQLite to access the file will not know that the journal exists (because
				1203	** the directory entry for the journal was never created) and the transaction
				1204	** will not roll back - possibly leading to database corruption.
				1205	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1206	static int unixSync(OsFile *id, int dataOnly){
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1207	int rc;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1208	unixFile pFile = (unixFile)id;
				1209	assert( pFile );
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1210	OSTRACE2("SYNC %-3d\n", pFile->h);
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1211	rc = full_fsync(pFile->h, pFile->fullSync, dataOnly);
				1212	SimulateIOError( rc=1 );
				1213	if( rc ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1214	return SQLITE_IOERR_FSYNC;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1215	}
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1216	if( pFile->dirfd>=0 ){
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1217	OSTRACE4("DIRSYNC %-3d (have_fullfsync=%d fullsync=%d)\n", pFile->dirfd,
drh	ac530b1	2006-02-11 01:25:50 +0000	[diff] [blame]	1218	HAVE_FULLFSYNC, pFile->fullSync);
danielk1977	d7c03f7	2005-11-25 10:38:22 +0000	[diff] [blame]	1219	#ifndef SQLITE_DISABLE_DIRSYNC
drh	ac530b1	2006-02-11 01:25:50 +0000	[diff] [blame]	1220	/* The directory sync is only attempted if full_fsync is
				1221	** turned off or unavailable. If a full_fsync occurred above,
				1222	** then the directory sync is superfluous.
				1223	*/
				1224	if( (!HAVE_FULLFSYNC \|\| !pFile->fullSync) && full_fsync(pFile->dirfd,0,0) ){
				1225	/*
				1226	** We have received multiple reports of fsync() returning
drh	86631a5	2006-02-09 23:05:51 +0000	[diff] [blame]	1227	** errors when applied to directories on certain file systems.
				1228	** A failed directory sync is not a big deal. So it seems
				1229	** better to ignore the error. Ticket #1657
				1230	*/
				1231	/* return SQLITE_IOERR; */
danielk1977	0964b23	2005-11-25 08:47:57 +0000	[diff] [blame]	1232	}
danielk1977	d7c03f7	2005-11-25 10:38:22 +0000	[diff] [blame]	1233	#endif
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1234	close(pFile->dirfd); /* Only need to sync once, so close the directory */
				1235	pFile->dirfd = -1; /* when we are done. */
drh	a285422	2004-06-17 19:04:17 +0000	[diff] [blame]	1236	}
drh	a285422	2004-06-17 19:04:17 +0000	[diff] [blame]	1237	return SQLITE_OK;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1238	}
				1239
				1240	/*
danielk1977	962398d	2004-06-14 09:35:16 +0000	[diff] [blame]	1241	** Sync the directory zDirname. This is a no-op on operating systems other
				1242	** than UNIX.
drh	b851b2c	2005-03-10 14:11:12 +0000	[diff] [blame]	1243	**
				1244	** This is used to make sure the master journal file has truely been deleted
				1245	** before making changes to individual journals on a multi-database commit.
drh	f30cc94	2005-03-11 17:52:34 +0000	[diff] [blame]	1246	** The F_FULLFSYNC option is not needed here.
danielk1977	962398d	2004-06-14 09:35:16 +0000	[diff] [blame]	1247	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1248	int sqlite3UnixSyncDirectory(const char *zDirname){
danielk1977	d7c03f7	2005-11-25 10:38:22 +0000	[diff] [blame]	1249	#ifdef SQLITE_DISABLE_DIRSYNC
				1250	return SQLITE_OK;
				1251	#else
danielk1977	962398d	2004-06-14 09:35:16 +0000	[diff] [blame]	1252	int fd;
				1253	int r;
drh	8e85577	2005-05-17 11:25:31 +0000	[diff] [blame]	1254	fd = open(zDirname, O_RDONLY\|O_BINARY, 0);
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1255	OSTRACE3("DIRSYNC %-3d (%s)\n", fd, zDirname);
danielk1977	962398d	2004-06-14 09:35:16 +0000	[diff] [blame]	1256	if( fd<0 ){
				1257	return SQLITE_CANTOPEN;
				1258	}
				1259	r = fsync(fd);
				1260	close(fd);
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1261	SimulateIOError( r=1 );
				1262	if( r ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1263	return SQLITE_IOERR_DIR_FSYNC;
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1264	}else{
				1265	return SQLITE_OK;
				1266	}
danielk1977	d7c03f7	2005-11-25 10:38:22 +0000	[diff] [blame]	1267	#endif
danielk1977	962398d	2004-06-14 09:35:16 +0000	[diff] [blame]	1268	}
				1269
				1270	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1271	** Truncate an open file to a specified size
				1272	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1273	static int unixTruncate(OsFile *id, i64 nByte){
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1274	int rc;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1275	assert( id );
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1276	rc = ftruncate(((unixFile*)id)->h, nByte);
				1277	SimulateIOError( rc=1 );
				1278	if( rc ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1279	return SQLITE_IOERR_TRUNCATE;
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1280	}else{
				1281	return SQLITE_OK;
				1282	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1283	}
				1284
				1285	/*
				1286	** Determine the current size of a file in bytes
				1287	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1288	static int unixFileSize(OsFile id, i64 pSize){
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1289	int rc;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1290	struct stat buf;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1291	assert( id );
drh	5968593	2006-09-14 13:47:11 +0000	[diff] [blame]	1292	rc = fstat(((unixFile*)id)->h, &buf);
				1293	SimulateIOError( rc=1 );
				1294	if( rc!=0 ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1295	return SQLITE_IOERR_FSTAT;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1296	}
				1297	*pSize = buf.st_size;
				1298	return SQLITE_OK;
				1299	}
				1300
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1301	/*
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1302	** This routine checks if there is a RESERVED lock held on the specified
				1303	** file by this or any other process. If such a lock is held, return
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1304	** non-zero. If the file is unlocked or holds only SHARED locks, then
				1305	** return zero.
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1306	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1307	static int unixCheckReservedLock(OsFile *id){
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1308	int r = 0;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1309	unixFile pFile = (unixFile)id;
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1310
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1311	assert( pFile );
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1312	sqlite3OsEnterMutex(); /* Because pFile->pLock is shared across threads */
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1313
				1314	/* Check if a thread in this process holds such a lock */
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1315	if( pFile->pLock->locktype>SHARED_LOCK ){
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1316	r = 1;
				1317	}
				1318
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1319	/* Otherwise see if some other process holds it.
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1320	*/
				1321	if( !r ){
				1322	struct flock lock;
				1323	lock.l_whence = SEEK_SET;
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1324	lock.l_start = RESERVED_BYTE;
				1325	lock.l_len = 1;
				1326	lock.l_type = F_WRLCK;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1327	fcntl(pFile->h, F_GETLK, &lock);
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1328	if( lock.l_type!=F_UNLCK ){
				1329	r = 1;
				1330	}
				1331	}
				1332
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1333	sqlite3OsLeaveMutex();
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1334	OSTRACE3("TEST WR-LOCK %d %d\n", pFile->h, r);
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1335
				1336	return r;
				1337	}
				1338
				1339	/*
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1340	** Lock the file with the lock specified by parameter locktype - one
				1341	** of the following:
				1342	**
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1343	** (1) SHARED_LOCK
				1344	** (2) RESERVED_LOCK
				1345	** (3) PENDING_LOCK
				1346	** (4) EXCLUSIVE_LOCK
				1347	**
drh	b3e0434	2004-06-08 00:47:47 +0000	[diff] [blame]	1348	** Sometimes when requesting one lock state, additional lock states
				1349	** are inserted in between. The locking might fail on one of the later
				1350	** transitions leaving the lock state different from what it started but
				1351	** still short of its goal. The following chart shows the allowed
				1352	** transitions and the inserted intermediate states:
				1353	**
				1354	** UNLOCKED -> SHARED
				1355	** SHARED -> RESERVED
				1356	** SHARED -> (PENDING) -> EXCLUSIVE
				1357	** RESERVED -> (PENDING) -> EXCLUSIVE
				1358	** PENDING -> EXCLUSIVE
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1359	**
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1360	** This routine will only increase a lock. Use the sqlite3OsUnlock()
				1361	** routine to lower a locking level.
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1362	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1363	static int unixLock(OsFile *id, int locktype){
danielk1977	f42f25c	2004-06-25 07:21:28 +0000	[diff] [blame]	1364	/* The following describes the implementation of the various locks and
				1365	** lock transitions in terms of the POSIX advisory shared and exclusive
				1366	** lock primitives (called read-locks and write-locks below, to avoid
				1367	** confusion with SQLite lock names). The algorithms are complicated
				1368	** slightly in order to be compatible with windows systems simultaneously
				1369	** accessing the same database file, in case that is ever required.
				1370	**
				1371	** Symbols defined in os.h indentify the 'pending byte' and the 'reserved
				1372	** byte', each single bytes at well known offsets, and the 'shared byte
				1373	** range', a range of 510 bytes at a well known offset.
				1374	**
				1375	** To obtain a SHARED lock, a read-lock is obtained on the 'pending
				1376	** byte'. If this is successful, a random byte from the 'shared byte
				1377	** range' is read-locked and the lock on the 'pending byte' released.
				1378	**
danielk1977	90ba3bd	2004-06-25 08:32:25 +0000	[diff] [blame]	1379	** A process may only obtain a RESERVED lock after it has a SHARED lock.
				1380	** A RESERVED lock is implemented by grabbing a write-lock on the
				1381	** 'reserved byte'.
danielk1977	f42f25c	2004-06-25 07:21:28 +0000	[diff] [blame]	1382	**
				1383	** A process may only obtain a PENDING lock after it has obtained a
danielk1977	90ba3bd	2004-06-25 08:32:25 +0000	[diff] [blame]	1384	** SHARED lock. A PENDING lock is implemented by obtaining a write-lock
				1385	** on the 'pending byte'. This ensures that no new SHARED locks can be
				1386	** obtained, but existing SHARED locks are allowed to persist. A process
				1387	** does not have to obtain a RESERVED lock on the way to a PENDING lock.
				1388	** This property is used by the algorithm for rolling back a journal file
				1389	** after a crash.
danielk1977	f42f25c	2004-06-25 07:21:28 +0000	[diff] [blame]	1390	**
danielk1977	90ba3bd	2004-06-25 08:32:25 +0000	[diff] [blame]	1391	** An EXCLUSIVE lock, obtained after a PENDING lock is held, is
				1392	** implemented by obtaining a write-lock on the entire 'shared byte
				1393	** range'. Since all other locks require a read-lock on one of the bytes
				1394	** within this range, this ensures that no other locks are held on the
				1395	** database.
danielk1977	f42f25c	2004-06-25 07:21:28 +0000	[diff] [blame]	1396	**
				1397	** The reason a single byte cannot be used instead of the 'shared byte
				1398	** range' is that some versions of windows do not support read-locks. By
				1399	** locking a random byte from a range, concurrent SHARED locks may exist
				1400	** even if the locking primitive used is always a write-lock.
				1401	*/
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1402	int rc = SQLITE_OK;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1403	unixFile pFile = (unixFile)id;
				1404	struct lockInfo *pLock = pFile->pLock;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1405	struct flock lock;
				1406	int s;
				1407
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1408	assert( pFile );
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1409	OSTRACE7("LOCK %d %s was %s(%s,%d) pid=%d\n", pFile->h,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1410	locktypeName(locktype), locktypeName(pFile->locktype),
				1411	locktypeName(pLock->locktype), pLock->cnt , getpid());
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1412
				1413	/* If there is already a lock of this type or more restrictive on the
				1414	** OsFile, do nothing. Don't use the end_lock: exit path, as
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1415	** sqlite3OsEnterMutex() hasn't been called yet.
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1416	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1417	if( pFile->locktype>=locktype ){
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1418	OSTRACE3("LOCK %d %s ok (already held)\n", pFile->h,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1419	locktypeName(locktype));
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1420	return SQLITE_OK;
				1421	}
				1422
drh	b3e0434	2004-06-08 00:47:47 +0000	[diff] [blame]	1423	/* Make sure the locking sequence is correct
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1424	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1425	assert( pFile->locktype!=NO_LOCK \|\| locktype==SHARED_LOCK );
drh	b3e0434	2004-06-08 00:47:47 +0000	[diff] [blame]	1426	assert( locktype!=PENDING_LOCK );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1427	assert( locktype!=RESERVED_LOCK \|\| pFile->locktype==SHARED_LOCK );
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1428
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1429	/* This mutex is needed because pFile->pLock is shared across threads
drh	b3e0434	2004-06-08 00:47:47 +0000	[diff] [blame]	1430	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1431	sqlite3OsEnterMutex();
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1432
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	1433	/* Make sure the current thread owns the pFile.
				1434	*/
				1435	rc = transferOwnership(pFile);
				1436	if( rc!=SQLITE_OK ){
				1437	sqlite3OsLeaveMutex();
				1438	return rc;
				1439	}
drh	64b1bea	2006-01-15 02:30:57 +0000	[diff] [blame]	1440	pLock = pFile->pLock;
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	1441
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1442	/* If some thread using this PID has a lock via a different OsFile*
				1443	** handle that precludes the requested lock, return BUSY.
				1444	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1445	if( (pFile->locktype!=pLock->locktype &&
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1446	(pLock->locktype>=PENDING_LOCK \|\| locktype>SHARED_LOCK))
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1447	){
				1448	rc = SQLITE_BUSY;
				1449	goto end_lock;
				1450	}
				1451
				1452	/* If a SHARED lock is requested, and some thread using this PID already
				1453	** has a SHARED or RESERVED lock, then increment reference counts and
				1454	** return SQLITE_OK.
				1455	*/
				1456	if( locktype==SHARED_LOCK &&
				1457	(pLock->locktype==SHARED_LOCK \|\| pLock->locktype==RESERVED_LOCK) ){
				1458	assert( locktype==SHARED_LOCK );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1459	assert( pFile->locktype==0 );
danielk1977	ecb2a96	2004-06-02 06:30:16 +0000	[diff] [blame]	1460	assert( pLock->cnt>0 );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1461	pFile->locktype = SHARED_LOCK;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1462	pLock->cnt++;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1463	pFile->pOpen->nLock++;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1464	goto end_lock;
				1465	}
				1466
danielk1977	13adf8a	2004-06-03 16:08:41 +0000	[diff] [blame]	1467	lock.l_len = 1L;
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1468
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1469	lock.l_whence = SEEK_SET;
				1470
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1471	/* A PENDING lock is needed before acquiring a SHARED lock and before
				1472	** acquiring an EXCLUSIVE lock. For the SHARED lock, the PENDING will
				1473	** be released.
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1474	*/
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1475	if( locktype==SHARED_LOCK
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1476	\|\| (locktype==EXCLUSIVE_LOCK && pFile->locktype<PENDING_LOCK)
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1477	){
danielk1977	489468c	2004-06-28 08:25:47 +0000	[diff] [blame]	1478	lock.l_type = (locktype==SHARED_LOCK?F_RDLCK:F_WRLCK);
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1479	lock.l_start = PENDING_BYTE;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1480	s = fcntl(pFile->h, F_SETLK, &lock);
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1481	if( s==(-1) ){
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1482	rc = (errno==EINVAL) ? SQLITE_NOLFS : SQLITE_BUSY;
				1483	goto end_lock;
				1484	}
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1485	}
				1486
				1487
				1488	/* If control gets to this point, then actually go ahead and make
				1489	** operating system calls for the specified lock.
				1490	*/
				1491	if( locktype==SHARED_LOCK ){
				1492	assert( pLock->cnt==0 );
				1493	assert( pLock->locktype==0 );
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1494
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1495	/* Now get the read-lock */
				1496	lock.l_start = SHARED_FIRST;
				1497	lock.l_len = SHARED_SIZE;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1498	s = fcntl(pFile->h, F_SETLK, &lock);
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1499
				1500	/* Drop the temporary PENDING lock */
				1501	lock.l_start = PENDING_BYTE;
				1502	lock.l_len = 1L;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1503	lock.l_type = F_UNLCK;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1504	if( fcntl(pFile->h, F_SETLK, &lock)!=0 ){
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1505	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1506	goto end_lock;
				1507	}
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1508	if( s==(-1) ){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1509	rc = (errno==EINVAL) ? SQLITE_NOLFS : SQLITE_BUSY;
				1510	}else{
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1511	pFile->locktype = SHARED_LOCK;
				1512	pFile->pOpen->nLock++;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1513	pLock->cnt = 1;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1514	}
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1515	}else if( locktype==EXCLUSIVE_LOCK && pLock->cnt>1 ){
				1516	/* We are trying for an exclusive lock but another thread in this
				1517	** same process is still holding a shared lock. */
				1518	rc = SQLITE_BUSY;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1519	}else{
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1520	/* The request was for a RESERVED or EXCLUSIVE lock. It is
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1521	** assumed that there is a SHARED or greater lock on the file
				1522	** already.
				1523	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1524	assert( 0!=pFile->locktype );
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1525	lock.l_type = F_WRLCK;
				1526	switch( locktype ){
				1527	case RESERVED_LOCK:
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1528	lock.l_start = RESERVED_BYTE;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1529	break;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1530	case EXCLUSIVE_LOCK:
drh	2ac3ee9	2004-06-07 16:27:46 +0000	[diff] [blame]	1531	lock.l_start = SHARED_FIRST;
				1532	lock.l_len = SHARED_SIZE;
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1533	break;
				1534	default:
				1535	assert(0);
				1536	}
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1537	s = fcntl(pFile->h, F_SETLK, &lock);
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1538	if( s==(-1) ){
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1539	rc = (errno==EINVAL) ? SQLITE_NOLFS : SQLITE_BUSY;
				1540	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1541	}
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1542
danielk1977	ecb2a96	2004-06-02 06:30:16 +0000	[diff] [blame]	1543	if( rc==SQLITE_OK ){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1544	pFile->locktype = locktype;
danielk1977	ecb2a96	2004-06-02 06:30:16 +0000	[diff] [blame]	1545	pLock->locktype = locktype;
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1546	}else if( locktype==EXCLUSIVE_LOCK ){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1547	pFile->locktype = PENDING_LOCK;
drh	3cde3bb	2004-06-12 02:17:14 +0000	[diff] [blame]	1548	pLock->locktype = PENDING_LOCK;
danielk1977	ecb2a96	2004-06-02 06:30:16 +0000	[diff] [blame]	1549	}
danielk1977	9a1d0ab	2004-06-01 14:09:28 +0000	[diff] [blame]	1550
				1551	end_lock:
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1552	sqlite3OsLeaveMutex();
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1553	OSTRACE4("LOCK %d %s %s\n", pFile->h, locktypeName(locktype),
danielk1977	2b44485	2004-06-29 07:45:33 +0000	[diff] [blame]	1554	rc==SQLITE_OK ? "ok" : "failed");
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1555	return rc;
				1556	}
				1557
				1558	/*
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1559	** Lower the locking level on file descriptor pFile to locktype. locktype
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1560	** must be either NO_LOCK or SHARED_LOCK.
				1561	**
				1562	** If the locking level of the file descriptor is already at or below
				1563	** the requested locking level, this routine is a no-op.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1564	*/
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	1565	static int unixUnlock(OsFile *id, int locktype){
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1566	struct lockInfo *pLock;
				1567	struct flock lock;
drh	9c105bb	2004-10-02 20:38:28 +0000	[diff] [blame]	1568	int rc = SQLITE_OK;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1569	unixFile pFile = (unixFile)id;
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1570
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1571	assert( pFile );
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1572	OSTRACE7("UNLOCK %d %d was %d(%d,%d) pid=%d\n", pFile->h, locktype,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1573	pFile->locktype, pFile->pLock->locktype, pFile->pLock->cnt, getpid());
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1574
				1575	assert( locktype<=SHARED_LOCK );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1576	if( pFile->locktype<=locktype ){
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1577	return SQLITE_OK;
				1578	}
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	1579	if( CHECK_THREADID(pFile) ){
				1580	return SQLITE_MISUSE;
				1581	}
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1582	sqlite3OsEnterMutex();
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1583	pLock = pFile->pLock;
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1584	assert( pLock->cnt!=0 );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1585	if( pFile->locktype>SHARED_LOCK ){
				1586	assert( pLock->locktype==pFile->locktype );
drh	9c105bb	2004-10-02 20:38:28 +0000	[diff] [blame]	1587	if( locktype==SHARED_LOCK ){
				1588	lock.l_type = F_RDLCK;
				1589	lock.l_whence = SEEK_SET;
				1590	lock.l_start = SHARED_FIRST;
				1591	lock.l_len = SHARED_SIZE;
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1592	if( fcntl(pFile->h, F_SETLK, &lock)==(-1) ){
drh	9c105bb	2004-10-02 20:38:28 +0000	[diff] [blame]	1593	/* This should never happen */
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1594	rc = SQLITE_IOERR_RDLOCK;
drh	9c105bb	2004-10-02 20:38:28 +0000	[diff] [blame]	1595	}
				1596	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1597	lock.l_type = F_UNLCK;
				1598	lock.l_whence = SEEK_SET;
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1599	lock.l_start = PENDING_BYTE;
				1600	lock.l_len = 2L; assert( PENDING_BYTE+1==RESERVED_BYTE );
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1601	if( fcntl(pFile->h, F_SETLK, &lock)!=(-1) ){
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1602	pLock->locktype = SHARED_LOCK;
				1603	}else{
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1604	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1605	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1606	}
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1607	if( locktype==NO_LOCK ){
				1608	struct openCnt *pOpen;
danielk1977	ecb2a96	2004-06-02 06:30:16 +0000	[diff] [blame]	1609
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1610	/* Decrement the shared lock counter. Release the lock using an
				1611	** OS call only when all threads in this same process have released
				1612	** the lock.
				1613	*/
				1614	pLock->cnt--;
				1615	if( pLock->cnt==0 ){
				1616	lock.l_type = F_UNLCK;
				1617	lock.l_whence = SEEK_SET;
				1618	lock.l_start = lock.l_len = 0L;
drh	e2396a1	2007-03-29 20:19:58 +0000	[diff] [blame]	1619	if( fcntl(pFile->h, F_SETLK, &lock)!=(-1) ){
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1620	pLock->locktype = NO_LOCK;
				1621	}else{
drh	4ac285a	2006-09-15 07:28:50 +0000	[diff] [blame]	1622	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
drh	2b4b596	2005-06-15 17:47:55 +0000	[diff] [blame]	1623	}
drh	a6abd04	2004-06-09 17:37:22 +0000	[diff] [blame]	1624	}
				1625
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1626	/* Decrement the count of locks against this same file. When the
				1627	** count reaches zero, close any other file descriptors whose close
				1628	** was deferred because of outstanding locks.
				1629	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1630	pOpen = pFile->pOpen;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1631	pOpen->nLock--;
				1632	assert( pOpen->nLock>=0 );
				1633	if( pOpen->nLock==0 && pOpen->nPending>0 ){
				1634	int i;
				1635	for(i=0; i<pOpen->nPending; i++){
				1636	close(pOpen->aPending[i]);
				1637	}
drh	64b1bea	2006-01-15 02:30:57 +0000	[diff] [blame]	1638	free(pOpen->aPending);
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1639	pOpen->nPending = 0;
				1640	pOpen->aPending = 0;
				1641	}
				1642	}
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1643	sqlite3OsLeaveMutex();
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1644	pFile->locktype = locktype;
drh	9c105bb	2004-10-02 20:38:28 +0000	[diff] [blame]	1645	return rc;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	1646	}
				1647
				1648	/*
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1649	** Close a file.
				1650	*/
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1651	static int unixClose(OsFile **pId){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	1652	unixFile id = (unixFile)*pId;
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	1653
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1654	if( !id ) return SQLITE_OK;
drh	3832230	2006-01-15 02:43:16 +0000	[diff] [blame]	1655	unixUnlock(*pId, NO_LOCK);
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1656	if( id->dirfd>=0 ) close(id->dirfd);
				1657	id->dirfd = -1;
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1658	sqlite3OsEnterMutex();
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	1659
drh	3832230	2006-01-15 02:43:16 +0000	[diff] [blame]	1660	if( id->pOpen->nLock ){
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1661	/* If there are outstanding locks, do not actually close the file just
				1662	** yet because that would clear those locks. Instead, add the file
				1663	** descriptor to pOpen->aPending. It will be automatically closed when
				1664	** the last lock is cleared.
				1665	*/
				1666	int *aNew;
				1667	struct openCnt *pOpen = id->pOpen;
drh	64b1bea	2006-01-15 02:30:57 +0000	[diff] [blame]	1668	aNew = realloc( pOpen->aPending, (pOpen->nPending+1)*sizeof(int) );
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1669	if( aNew==0 ){
				1670	/* If a malloc fails, just leak the file descriptor */
				1671	}else{
				1672	pOpen->aPending = aNew;
drh	ad81e87	2005-08-21 21:45:01 +0000	[diff] [blame]	1673	pOpen->aPending[pOpen->nPending] = id->h;
				1674	pOpen->nPending++;
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1675	}
				1676	}else{
				1677	/* There are no outstanding locks so we can close the file immediately */
				1678	close(id->h);
				1679	}
				1680	releaseLockInfo(id->pLock);
				1681	releaseOpenCnt(id->pOpen);
danielk1977	441b09a	2006-01-05 13:48:29 +0000	[diff] [blame]	1682
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	1683	sqlite3OsLeaveMutex();
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1684	id->isOpen = 0;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1685	OSTRACE2("CLOSE %-3d\n", id->h);
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1686	OpenCounter(-1);
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	1687	sqlite3ThreadSafeFree(id);
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	1688	*pId = 0;
drh	02afc86	2006-01-20 18:10:57 +0000	[diff] [blame]	1689	return SQLITE_OK;
danielk1977	e302663	2004-06-22 11:29:02 +0000	[diff] [blame]	1690	}
				1691
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1692
				1693	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				1694	#pragma mark AFP Support
				1695
				1696	/*
				1697	** The afpLockingContext structure contains all afp lock specific state
				1698	*/
				1699	typedef struct afpLockingContext afpLockingContext;
				1700	struct afpLockingContext {
				1701	unsigned long long sharedLockByte;
				1702	char *filePath;
				1703	};
				1704
				1705	struct ByteRangeLockPB2
				1706	{
				1707	unsigned long long offset; /* offset to first byte to lock */
				1708	unsigned long long length; /* nbr of bytes to lock */
				1709	unsigned long long retRangeStart; /* nbr of 1st byte locked if successful */
				1710	unsigned char unLockFlag; /* 1 = unlock, 0 = lock */
				1711	unsigned char startEndFlag; /* 1=rel to end of fork, 0=rel to start */
				1712	int fd; /* file desc to assoc this lock with */
				1713	};
				1714
				1715	#define afpfsByteRangeLock2FSCTL _IOWR('z', 23, struct ByteRangeLockPB2)
				1716
				1717	/* return 0 on success, 1 on failure. To match the behavior of the
				1718	normal posix file locking (used in unixLock for example), we should
				1719	provide 'richer' return codes - specifically to differentiate between
				1720	'file busy' and 'file system error' results */
				1721	static int _AFPFSSetLock(const char *path, int fd, unsigned long long offset,
				1722	unsigned long long length, int setLockFlag)
				1723	{
				1724	struct ByteRangeLockPB2 pb;
				1725	int err;
				1726
				1727	pb.unLockFlag = setLockFlag ? 0 : 1;
				1728	pb.startEndFlag = 0;
				1729	pb.offset = offset;
				1730	pb.length = length;
				1731	pb.fd = fd;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1732	OSTRACE5("AFPLOCK setting lock %s for %d in range %llx:%llx\n",
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1733	(setLockFlag?"ON":"OFF"), fd, offset, length);
				1734	err = fsctl(path, afpfsByteRangeLock2FSCTL, &pb, 0);
				1735	if ( err==-1 ) {
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1736	OSTRACE4("AFPLOCK failed to fsctl() '%s' %d %s\n", path, errno,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1737	strerror(errno));
				1738	return 1; // error
				1739	} else {
				1740	return 0;
				1741	}
				1742	}
				1743
				1744	/*
				1745	** This routine checks if there is a RESERVED lock held on the specified
				1746	** file by this or any other process. If such a lock is held, return
				1747	** non-zero. If the file is unlocked or holds only SHARED locks, then
				1748	** return zero.
				1749	*/
				1750	static int afpUnixCheckReservedLock(OsFile *id){
				1751	int r = 0;
				1752	unixFile pFile = (unixFile)id;
				1753
				1754	assert( pFile );
				1755	afpLockingContext context = (afpLockingContext ) pFile->lockingContext;
				1756
				1757	/* Check if a thread in this process holds such a lock */
				1758	if( pFile->locktype>SHARED_LOCK ){
				1759	r = 1;
				1760	}
				1761
				1762	/* Otherwise see if some other process holds it.
				1763	*/
				1764	if ( !r ) {
				1765	// lock the byte
				1766	int failed = _AFPFSSetLock(context->filePath, pFile->h, RESERVED_BYTE, 1,1);
				1767	if (failed) {
				1768	/* if we failed to get the lock then someone else must have it */
				1769	r = 1;
				1770	} else {
				1771	/* if we succeeded in taking the reserved lock, unlock it to restore
				1772	** the original state */
				1773	_AFPFSSetLock(context->filePath, pFile->h, RESERVED_BYTE, 1, 0);
				1774	}
				1775	}
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1776	OSTRACE3("TEST WR-LOCK %d %d\n", pFile->h, r);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1777
				1778	return r;
				1779	}
				1780
				1781	/* AFP-style locking following the behavior of unixLock, see the unixLock
				1782	** function comments for details of lock management. */
				1783	static int afpUnixLock(OsFile *id, int locktype)
				1784	{
				1785	int rc = SQLITE_OK;
				1786	unixFile pFile = (unixFile)id;
				1787	afpLockingContext context = (afpLockingContext ) pFile->lockingContext;
				1788	int gotPendingLock = 0;
				1789
				1790	assert( pFile );
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1791	OSTRACE5("LOCK %d %s was %s pid=%d\n", pFile->h,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1792	locktypeName(locktype), locktypeName(pFile->locktype), getpid());
				1793	/* If there is already a lock of this type or more restrictive on the
				1794	** OsFile, do nothing. Don't use the afp_end_lock: exit path, as
				1795	** sqlite3OsEnterMutex() hasn't been called yet.
				1796	*/
				1797	if( pFile->locktype>=locktype ){
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1798	OSTRACE3("LOCK %d %s ok (already held)\n", pFile->h,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1799	locktypeName(locktype));
				1800	return SQLITE_OK;
				1801	}
				1802
				1803	/* Make sure the locking sequence is correct
				1804	*/
				1805	assert( pFile->locktype!=NO_LOCK \|\| locktype==SHARED_LOCK );
				1806	assert( locktype!=PENDING_LOCK );
				1807	assert( locktype!=RESERVED_LOCK \|\| pFile->locktype==SHARED_LOCK );
				1808
				1809	/* This mutex is needed because pFile->pLock is shared across threads
				1810	*/
				1811	sqlite3OsEnterMutex();
				1812
				1813	/* Make sure the current thread owns the pFile.
				1814	*/
				1815	rc = transferOwnership(pFile);
				1816	if( rc!=SQLITE_OK ){
				1817	sqlite3OsLeaveMutex();
				1818	return rc;
				1819	}
				1820
				1821	/* A PENDING lock is needed before acquiring a SHARED lock and before
				1822	** acquiring an EXCLUSIVE lock. For the SHARED lock, the PENDING will
				1823	** be released.
				1824	*/
				1825	if( locktype==SHARED_LOCK
				1826	\|\| (locktype==EXCLUSIVE_LOCK && pFile->locktype<PENDING_LOCK)
				1827	){
				1828	int failed = _AFPFSSetLock(context->filePath, pFile->h,
				1829	PENDING_BYTE, 1, 1);
				1830	if (failed) {
				1831	rc = SQLITE_BUSY;
				1832	goto afp_end_lock;
				1833	}
				1834	}
				1835
				1836	/* If control gets to this point, then actually go ahead and make
				1837	** operating system calls for the specified lock.
				1838	*/
				1839	if( locktype==SHARED_LOCK ){
				1840	int lk, failed;
				1841	int tries = 0;
				1842
				1843	/* Now get the read-lock */
				1844	/* note that the quality of the randomness doesn't matter that much */
				1845	lk = random();
				1846	context->sharedLockByte = (lk & 0x7fffffff)%(SHARED_SIZE - 1);
				1847	failed = _AFPFSSetLock(context->filePath, pFile->h,
				1848	SHARED_FIRST+context->sharedLockByte, 1, 1);
				1849
				1850	/* Drop the temporary PENDING lock */
				1851	if (_AFPFSSetLock(context->filePath, pFile->h, PENDING_BYTE, 1, 0)) {
				1852	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
				1853	goto afp_end_lock;
				1854	}
				1855
				1856	if( failed ){
				1857	rc = SQLITE_BUSY;
				1858	} else {
				1859	pFile->locktype = SHARED_LOCK;
				1860	}
				1861	}else{
				1862	/* The request was for a RESERVED or EXCLUSIVE lock. It is
				1863	** assumed that there is a SHARED or greater lock on the file
				1864	** already.
				1865	*/
				1866	int failed = 0;
				1867	assert( 0!=pFile->locktype );
				1868	if (locktype >= RESERVED_LOCK && pFile->locktype < RESERVED_LOCK) {
				1869	/* Acquire a RESERVED lock */
				1870	failed = _AFPFSSetLock(context->filePath, pFile->h, RESERVED_BYTE, 1,1);
				1871	}
				1872	if (!failed && locktype == EXCLUSIVE_LOCK) {
				1873	/* Acquire an EXCLUSIVE lock */
				1874
				1875	/* Remove the shared lock before trying the range. we'll need to
				1876	** reestablish the shared lock if we can't get the afpUnixUnlock
				1877	*/
				1878	if (!_AFPFSSetLock(context->filePath, pFile->h, SHARED_FIRST +
				1879	context->sharedLockByte, 1, 0)) {
				1880	/* now attemmpt to get the exclusive lock range */
				1881	failed = _AFPFSSetLock(context->filePath, pFile->h, SHARED_FIRST,
				1882	SHARED_SIZE, 1);
				1883	if (failed && _AFPFSSetLock(context->filePath, pFile->h, SHARED_FIRST +
				1884	context->sharedLockByte, 1, 1)) {
				1885	rc = SQLITE_IOERR_RDLOCK; /* this should never happen */
				1886	}
				1887	} else {
				1888	/* */
				1889	rc = SQLITE_IOERR_UNLOCK; /* this should never happen */
				1890	}
				1891	}
				1892	if( failed && rc == SQLITE_OK){
				1893	rc = SQLITE_BUSY;
				1894	}
				1895	}
				1896
				1897	if( rc==SQLITE_OK ){
				1898	pFile->locktype = locktype;
				1899	}else if( locktype==EXCLUSIVE_LOCK ){
				1900	pFile->locktype = PENDING_LOCK;
				1901	}
				1902
				1903	afp_end_lock:
				1904	sqlite3OsLeaveMutex();
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1905	OSTRACE4("LOCK %d %s %s\n", pFile->h, locktypeName(locktype),
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1906	rc==SQLITE_OK ? "ok" : "failed");
				1907	return rc;
				1908	}
				1909
				1910	/*
				1911	** Lower the locking level on file descriptor pFile to locktype. locktype
				1912	** must be either NO_LOCK or SHARED_LOCK.
				1913	**
				1914	** If the locking level of the file descriptor is already at or below
				1915	** the requested locking level, this routine is a no-op.
				1916	*/
				1917	static int afpUnixUnlock(OsFile *id, int locktype) {
				1918	struct flock lock;
				1919	int rc = SQLITE_OK;
				1920	unixFile pFile = (unixFile)id;
				1921	afpLockingContext context = (afpLockingContext ) pFile->lockingContext;
				1922
				1923	assert( pFile );
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	1924	OSTRACE5("UNLOCK %d %d was %d pid=%d\n", pFile->h, locktype,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	1925	pFile->locktype, getpid());
				1926
				1927	assert( locktype<=SHARED_LOCK );
				1928	if( pFile->locktype<=locktype ){
				1929	return SQLITE_OK;
				1930	}
				1931	if( CHECK_THREADID(pFile) ){
				1932	return SQLITE_MISUSE;
				1933	}
				1934	sqlite3OsEnterMutex();
				1935	if( pFile->locktype>SHARED_LOCK ){
				1936	if( locktype==SHARED_LOCK ){
				1937	int failed = 0;
				1938
				1939	/* unlock the exclusive range - then re-establish the shared lock */
				1940	if (pFile->locktype==EXCLUSIVE_LOCK) {
				1941	failed = _AFPFSSetLock(context->filePath, pFile->h, SHARED_FIRST,
				1942	SHARED_SIZE, 0);
				1943	if (!failed) {
				1944	/* successfully removed the exclusive lock */
				1945	if (_AFPFSSetLock(context->filePath, pFile->h, SHARED_FIRST+
				1946	context->sharedLockByte, 1, 1)) {
				1947	/* failed to re-establish our shared lock */
				1948	rc = SQLITE_IOERR_RDLOCK; /* This should never happen */
				1949	}
				1950	} else {
				1951	/* This should never happen - failed to unlock the exclusive range */
				1952	rc = SQLITE_IOERR_UNLOCK;
				1953	}
				1954	}
				1955	}
				1956	if (rc == SQLITE_OK && pFile->locktype>=PENDING_LOCK) {
				1957	if (_AFPFSSetLock(context->filePath, pFile->h, PENDING_BYTE, 1, 0)){
				1958	/* failed to release the pending lock */
				1959	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
				1960	}
				1961	}
				1962	if (rc == SQLITE_OK && pFile->locktype>=RESERVED_LOCK) {
				1963	if (_AFPFSSetLock(context->filePath, pFile->h, RESERVED_BYTE, 1, 0)) {
				1964	/* failed to release the reserved lock */
				1965	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
				1966	}
				1967	}
				1968	}
				1969	if( locktype==NO_LOCK ){
				1970	int failed = _AFPFSSetLock(context->filePath, pFile->h,
				1971	SHARED_FIRST + context->sharedLockByte, 1, 0);
				1972	if (failed) {
				1973	rc = SQLITE_IOERR_UNLOCK; /* This should never happen */
				1974	}
				1975	}
				1976	if (rc == SQLITE_OK)
				1977	pFile->locktype = locktype;
				1978	sqlite3OsLeaveMutex();
				1979	return rc;
				1980	}
				1981
				1982	/*
				1983	** Close a file & cleanup AFP specific locking context
				1984	*/
				1985	static int afpUnixClose(OsFile **pId) {
				1986	unixFile id = (unixFile)*pId;
				1987
				1988	if( !id ) return SQLITE_OK;
				1989	afpUnixUnlock(*pId, NO_LOCK);
				1990	/* free the AFP locking structure */
				1991	if (id->lockingContext != NULL) {
				1992	if (((afpLockingContext *)id->lockingContext)->filePath != NULL)
				1993	sqlite3ThreadSafeFree(((afpLockingContext*)id->lockingContext)->filePath);
				1994	sqlite3ThreadSafeFree(id->lockingContext);
				1995	}
				1996
				1997	if( id->dirfd>=0 ) close(id->dirfd);
				1998	id->dirfd = -1;
				1999	close(id->h);
				2000	id->isOpen = 0;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	2001	OSTRACE2("CLOSE %-3d\n", id->h);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2002	OpenCounter(-1);
				2003	sqlite3ThreadSafeFree(id);
				2004	*pId = 0;
				2005	return SQLITE_OK;
				2006	}
				2007
				2008
				2009	#pragma mark flock() style locking
				2010
				2011	/*
				2012	** The flockLockingContext is not used
				2013	*/
				2014	typedef void flockLockingContext;
				2015
				2016	static int flockUnixCheckReservedLock(OsFile *id) {
				2017	unixFile pFile = (unixFile)id;
				2018
				2019	if (pFile->locktype == RESERVED_LOCK) {
				2020	return 1; // already have a reserved lock
				2021	} else {
				2022	// attempt to get the lock
				2023	int rc = flock(pFile->h, LOCK_EX \| LOCK_NB);
				2024	if (!rc) {
				2025	// got the lock, unlock it
				2026	flock(pFile->h, LOCK_UN);
				2027	return 0; // no one has it reserved
				2028	}
				2029	return 1; // someone else might have it reserved
				2030	}
				2031	}
				2032
				2033	static int flockUnixLock(OsFile *id, int locktype) {
				2034	unixFile pFile = (unixFile)id;
				2035
				2036	// if we already have a lock, it is exclusive.
				2037	// Just adjust level and punt on outta here.
				2038	if (pFile->locktype > NO_LOCK) {
				2039	pFile->locktype = locktype;
				2040	return SQLITE_OK;
				2041	}
				2042
				2043	// grab an exclusive lock
				2044	int rc = flock(pFile->h, LOCK_EX \| LOCK_NB);
				2045	if (rc) {
				2046	// didn't get, must be busy
				2047	return SQLITE_BUSY;
				2048	} else {
				2049	// got it, set the type and return ok
				2050	pFile->locktype = locktype;
				2051	return SQLITE_OK;
				2052	}
				2053	}
				2054
				2055	static int flockUnixUnlock(OsFile *id, int locktype) {
				2056	unixFile pFile = (unixFile)id;
				2057
				2058	assert( locktype<=SHARED_LOCK );
				2059
				2060	// no-op if possible
				2061	if( pFile->locktype==locktype ){
				2062	return SQLITE_OK;
				2063	}
				2064
				2065	// shared can just be set because we always have an exclusive
				2066	if (locktype==SHARED_LOCK) {
				2067	pFile->locktype = locktype;
				2068	return SQLITE_OK;
				2069	}
				2070
				2071	// no, really, unlock.
				2072	int rc = flock(pFile->h, LOCK_UN);
				2073	if (rc)
				2074	return SQLITE_IOERR_UNLOCK;
				2075	else {
				2076	pFile->locktype = NO_LOCK;
				2077	return SQLITE_OK;
				2078	}
				2079	}
				2080
				2081	/*
				2082	** Close a file.
				2083	*/
				2084	static int flockUnixClose(OsFile **pId) {
				2085	unixFile id = (unixFile)*pId;
				2086
				2087	if( !id ) return SQLITE_OK;
				2088	flockUnixUnlock(*pId, NO_LOCK);
				2089
				2090	if( id->dirfd>=0 ) close(id->dirfd);
				2091	id->dirfd = -1;
				2092	sqlite3OsEnterMutex();
				2093
				2094	close(id->h);
				2095	sqlite3OsLeaveMutex();
				2096	id->isOpen = 0;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	2097	OSTRACE2("CLOSE %-3d\n", id->h);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2098	OpenCounter(-1);
				2099	sqlite3ThreadSafeFree(id);
				2100	*pId = 0;
				2101	return SQLITE_OK;
				2102	}
				2103
				2104	#pragma mark Old-School .lock file based locking
				2105
				2106	/*
				2107	** The dotlockLockingContext structure contains all dotlock (.lock) lock
				2108	** specific state
				2109	*/
				2110	typedef struct dotlockLockingContext dotlockLockingContext;
				2111	struct dotlockLockingContext {
				2112	char *lockPath;
				2113	};
				2114
				2115
				2116	static int dotlockUnixCheckReservedLock(OsFile *id) {
				2117	unixFile pFile = (unixFile)id;
				2118	dotlockLockingContext *context =
				2119	(dotlockLockingContext *) pFile->lockingContext;
				2120
				2121	if (pFile->locktype == RESERVED_LOCK) {
				2122	return 1; // already have a reserved lock
				2123	} else {
				2124	struct stat statBuf;
				2125	if (lstat(context->lockPath,&statBuf) == 0)
				2126	// file exists, someone else has the lock
				2127	return 1;
				2128	else
				2129	// file does not exist, we could have it if we want it
				2130	return 0;
				2131	}
				2132	}
				2133
				2134	static int dotlockUnixLock(OsFile *id, int locktype) {
				2135	unixFile pFile = (unixFile)id;
				2136	dotlockLockingContext *context =
				2137	(dotlockLockingContext *) pFile->lockingContext;
				2138
				2139	// if we already have a lock, it is exclusive.
				2140	// Just adjust level and punt on outta here.
				2141	if (pFile->locktype > NO_LOCK) {
				2142	pFile->locktype = locktype;
				2143
				2144	/* Always update the timestamp on the old file */
				2145	utimes(context->lockPath,NULL);
				2146	return SQLITE_OK;
				2147	}
				2148
				2149	// check to see if lock file already exists
				2150	struct stat statBuf;
				2151	if (lstat(context->lockPath,&statBuf) == 0){
				2152	return SQLITE_BUSY; // it does, busy
				2153	}
				2154
				2155	// grab an exclusive lock
				2156	int fd = open(context->lockPath,O_RDONLY\|O_CREAT\|O_EXCL,0600);
				2157	if (fd < 0) {
				2158	// failed to open/create the file, someone else may have stolen the lock
				2159	return SQLITE_BUSY;
				2160	}
				2161	close(fd);
				2162
				2163	// got it, set the type and return ok
				2164	pFile->locktype = locktype;
				2165	return SQLITE_OK;
				2166	}
				2167
				2168	static int dotlockUnixUnlock(OsFile *id, int locktype) {
				2169	unixFile pFile = (unixFile)id;
				2170	dotlockLockingContext *context =
				2171	(dotlockLockingContext *) pFile->lockingContext;
				2172
				2173	assert( locktype<=SHARED_LOCK );
				2174
				2175	// no-op if possible
				2176	if( pFile->locktype==locktype ){
				2177	return SQLITE_OK;
				2178	}
				2179
				2180	// shared can just be set because we always have an exclusive
				2181	if (locktype==SHARED_LOCK) {
				2182	pFile->locktype = locktype;
				2183	return SQLITE_OK;
				2184	}
				2185
				2186	// no, really, unlock.
				2187	unlink(context->lockPath);
				2188	pFile->locktype = NO_LOCK;
				2189	return SQLITE_OK;
				2190	}
				2191
				2192	/*
				2193	** Close a file.
				2194	*/
				2195	static int dotlockUnixClose(OsFile **pId) {
				2196	unixFile id = (unixFile)*pId;
				2197
				2198	if( !id ) return SQLITE_OK;
				2199	dotlockUnixUnlock(*pId, NO_LOCK);
				2200	/* free the dotlock locking structure */
				2201	if (id->lockingContext != NULL) {
				2202	if (((dotlockLockingContext *)id->lockingContext)->lockPath != NULL)
				2203	sqlite3ThreadSafeFree( ( (dotlockLockingContext *)
				2204	id->lockingContext)->lockPath);
				2205	sqlite3ThreadSafeFree(id->lockingContext);
				2206	}
				2207
				2208	if( id->dirfd>=0 ) close(id->dirfd);
				2209	id->dirfd = -1;
				2210	sqlite3OsEnterMutex();
				2211
				2212	close(id->h);
				2213
				2214	sqlite3OsLeaveMutex();
				2215	id->isOpen = 0;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	2216	OSTRACE2("CLOSE %-3d\n", id->h);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2217	OpenCounter(-1);
				2218	sqlite3ThreadSafeFree(id);
				2219	*pId = 0;
				2220	return SQLITE_OK;
				2221	}
				2222
				2223
				2224	#pragma mark No locking
				2225
				2226	/*
				2227	** The nolockLockingContext is void
				2228	*/
				2229	typedef void nolockLockingContext;
				2230
				2231	static int nolockUnixCheckReservedLock(OsFile *id) {
				2232	return 0;
				2233	}
				2234
				2235	static int nolockUnixLock(OsFile *id, int locktype) {
				2236	return SQLITE_OK;
				2237	}
				2238
				2239	static int nolockUnixUnlock(OsFile *id, int locktype) {
				2240	return SQLITE_OK;
				2241	}
				2242
				2243	/*
				2244	** Close a file.
				2245	*/
				2246	static int nolockUnixClose(OsFile **pId) {
				2247	unixFile id = (unixFile)*pId;
				2248
				2249	if( !id ) return SQLITE_OK;
				2250	if( id->dirfd>=0 ) close(id->dirfd);
				2251	id->dirfd = -1;
				2252	sqlite3OsEnterMutex();
				2253
				2254	close(id->h);
				2255
				2256	sqlite3OsLeaveMutex();
				2257	id->isOpen = 0;
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	2258	OSTRACE2("CLOSE %-3d\n", id->h);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2259	OpenCounter(-1);
				2260	sqlite3ThreadSafeFree(id);
				2261	*pId = 0;
				2262	return SQLITE_OK;
				2263	}
				2264
				2265	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
				2266
/*
** Turn a relative pathname into a full pathname.  Return a pointer
** to the full pathname stored in space obtained from sqliteMalloc().
** The calling function is responsible for freeing this space once it
** is no longer needed.
**
** A name that already begins with '/' is copied as-is; otherwise the
** current working directory and a '/' are prepended.  Returns 0 if the
** scratch buffer for getcwd() cannot be allocated.
*/
char *sqlite3UnixFullPathname(const char *zRelative){
  char *zFull = 0;
  if( zRelative[0]=='/' ){
    sqlite3SetString(&zFull, zRelative, (char*)0);
  }else{
    char *zBuf = sqliteMalloc(5000);
    if( zBuf==0 ){
      return 0;
    }
    zBuf[0] = 0;
    sqlite3SetString(&zFull, getcwd(zBuf, 5000), "/", zRelative,
                    (char*)0);
    sqliteFree(zBuf);
  }

#if 0
  /*
  ** Remove "/./" path elements and convert "/A/./" path elements
  ** to just "/".
  */
  if( zFull ){
    int i, j;
    for(i=j=0; zFull[i]; i++){
      if( zFull[i]=='/' ){
        if( zFull[i+1]=='/' ) continue;
        if( zFull[i+1]=='.' && zFull[i+2]=='/' ){
          i += 1;
          continue;
        }
        if( zFull[i+1]=='.' && zFull[i+2]=='.' && zFull[i+3]=='/' ){
          while( j>0 && zFull[j-1]!='/' ){ j--; }
          i += 3;
          continue;
        }
      }
      zFull[j++] = zFull[i];
    }
    zFull[j] = 0;
  }
#endif

  return zFull;
}
				2316
drh	1883921	2005-11-26 03:43:23 +0000	[diff] [blame]	2317	/*
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2318	** Change the value of the fullsync flag in the given file descriptor.
drh	1883921	2005-11-26 03:43:23 +0000	[diff] [blame]	2319	*/
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2320	static void unixSetFullSync(OsFile *id, int v){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2321	((unixFile*)id)->fullSync = v;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2322	}
				2323
				2324	/*
				2325	** Return the underlying file handle for an OsFile
				2326	*/
				2327	static int unixFileHandle(OsFile *id){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2328	return ((unixFile*)id)->h;
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2329	}
				2330
				2331	/*
				2332	** Return an integer that indices the type of lock currently held
				2333	** by this handle. (Used for testing and analysis only.)
				2334	*/
				2335	static int unixLockState(OsFile *id){
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2336	return ((unixFile*)id)->locktype;
drh	1883921	2005-11-26 03:43:23 +0000	[diff] [blame]	2337	}
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	2338
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2339	/*
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2340	** Return the sector size in bytes of the underlying block device for
				2341	** the specified file. This is almost always 512 bytes, but may be
				2342	** larger for some devices.
				2343	**
				2344	** SQLite code assumes this function cannot fail. It also assumes that
				2345	** if two files are created in the same file-system directory (i.e.
				2346	** a database and it's journal file) that the sector size will be the
				2347	** same for both.
				2348	*/
				2349	static int unixSectorSize(OsFile *id){
drh	3ceeb75	2007-03-29 18:19:52 +0000	[diff] [blame]	2350	return SQLITE_DEFAULT_SECTOR_SIZE;
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2351	}
				2352
				2353	/*
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2354	** This vector defines all the methods that can operate on an OsFile
				2355	** for unix.
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2356	*/
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2357	static const IoMethod sqlite3UnixIoMethod = {
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2358	unixClose,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2359	unixOpenDirectory,
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2360	unixRead,
				2361	unixWrite,
				2362	unixSeek,
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2363	unixTruncate,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2364	unixSync,
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2365	unixSetFullSync,
				2366	unixFileHandle,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2367	unixFileSize,
				2368	unixLock,
				2369	unixUnlock,
drh	9cbe635	2005-11-29 03:13:21 +0000	[diff] [blame]	2370	unixLockState,
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2371	unixCheckReservedLock,
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2372	unixSectorSize,
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2373	};
				2374
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2375	#ifdef SQLITE_ENABLE_LOCKING_STYLE
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2376	/*
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2377	** This vector defines all the methods that can operate on an OsFile
				2378	** for unix with AFP style file locking.
				2379	*/
				2380	static const IoMethod sqlite3AFPLockingUnixIoMethod = {
				2381	afpUnixClose,
				2382	unixOpenDirectory,
				2383	unixRead,
				2384	unixWrite,
				2385	unixSeek,
				2386	unixTruncate,
				2387	unixSync,
				2388	unixSetFullSync,
				2389	unixFileHandle,
				2390	unixFileSize,
				2391	afpUnixLock,
				2392	afpUnixUnlock,
				2393	unixLockState,
				2394	afpUnixCheckReservedLock,
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2395	unixSectorSize,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2396	};
				2397
				2398	/*
				2399	** This vector defines all the methods that can operate on an OsFile
				2400	** for unix with flock() style file locking.
				2401	*/
				2402	static const IoMethod sqlite3FlockLockingUnixIoMethod = {
				2403	flockUnixClose,
				2404	unixOpenDirectory,
				2405	unixRead,
				2406	unixWrite,
				2407	unixSeek,
				2408	unixTruncate,
				2409	unixSync,
				2410	unixSetFullSync,
				2411	unixFileHandle,
				2412	unixFileSize,
				2413	flockUnixLock,
				2414	flockUnixUnlock,
				2415	unixLockState,
				2416	flockUnixCheckReservedLock,
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2417	unixSectorSize,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2418	};
				2419
				2420	/*
				2421	** This vector defines all the methods that can operate on an OsFile
				2422	** for unix with dotlock style file locking.
				2423	*/
				2424	static const IoMethod sqlite3DotlockLockingUnixIoMethod = {
				2425	dotlockUnixClose,
				2426	unixOpenDirectory,
				2427	unixRead,
				2428	unixWrite,
				2429	unixSeek,
				2430	unixTruncate,
				2431	unixSync,
				2432	unixSetFullSync,
				2433	unixFileHandle,
				2434	unixFileSize,
				2435	dotlockUnixLock,
				2436	dotlockUnixUnlock,
				2437	unixLockState,
				2438	dotlockUnixCheckReservedLock,
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2439	unixSectorSize,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2440	};
				2441
				2442	/*
				2443	** This vector defines all the methods that can operate on an OsFile
				2444	** for unix with dotlock style file locking.
				2445	*/
				2446	static const IoMethod sqlite3NolockLockingUnixIoMethod = {
				2447	nolockUnixClose,
				2448	unixOpenDirectory,
				2449	unixRead,
				2450	unixWrite,
				2451	unixSeek,
				2452	unixTruncate,
				2453	unixSync,
				2454	unixSetFullSync,
				2455	unixFileHandle,
				2456	unixFileSize,
				2457	nolockUnixLock,
				2458	nolockUnixUnlock,
				2459	unixLockState,
				2460	nolockUnixCheckReservedLock,
danielk1977	a3d4c88	2007-03-23 10:08:38 +0000	[diff] [blame]	2461	unixSectorSize,
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2462	};
				2463
				2464	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
				2465
				2466	/*
				2467	** Allocate memory for a new unixFile and initialize that unixFile.
				2468	** Write a pointer to the new unixFile into *pId.
				2469	** If we run out of memory, close the file and return an error.
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2470	*/
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2471	#ifdef SQLITE_ENABLE_LOCKING_STYLE
				2472	/*
				2473	** When locking extensions are enabled, the filepath and locking style
				2474	** are needed to determine the unixFile pMethod to use for locking operations.
				2475	** The locking-style specific lockingContext data structure is created
				2476	** and assigned here also.
				2477	*/
				2478	static int allocateUnixFile(
				2479	int h, /* Open file descriptor of file being opened */
				2480	OsFile *pId, / Write completed initialization here */
				2481	const char zFilename, / Name of the file being opened */
				2482	int delFlag /* Delete-on-or-before-close flag */
				2483	){
aswift	108bc32	2006-10-11 17:19:46 +0000	[diff] [blame]	2484	sqlite3LockingStyle lockingStyle;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2485	unixFile *pNew;
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2486	unixFile f;
				2487	int rc;
				2488
drh	61fc595	2007-04-01 23:49:51 +0000	[diff] [blame^]	2489	memset(&f, 0, sizeof(f));
aswift	448aa6f	2006-11-11 01:31:58 +0000	[diff] [blame]	2490	lockingStyle = sqlite3DetectLockingStyle(zFilename, h);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2491	if ( lockingStyle == posixLockingStyle ) {
				2492	sqlite3OsEnterMutex();
				2493	rc = findLockInfo(h, &f.pLock, &f.pOpen);
				2494	sqlite3OsLeaveMutex();
				2495	if( rc ){
				2496	close(h);
				2497	unlink(zFilename);
				2498	return SQLITE_NOMEM;
				2499	}
				2500	} else {
				2501	// pLock and pOpen are only used for posix advisory locking
				2502	f.pLock = NULL;
				2503	f.pOpen = NULL;
				2504	}
				2505	if( delFlag ){
				2506	unlink(zFilename);
				2507	}
				2508	f.dirfd = -1;
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2509	f.h = h;
				2510	SET_THREADID(&f);
danielk1977	750b03e	2006-02-14 10:48:39 +0000	[diff] [blame]	2511	pNew = sqlite3ThreadSafeMalloc( sizeof(unixFile) );
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2512	if( pNew==0 ){
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2513	close(h);
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	2514	sqlite3OsEnterMutex();
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2515	releaseLockInfo(f.pLock);
				2516	releaseOpenCnt(f.pOpen);
drh	029b44b	2006-01-15 00:13:15 +0000	[diff] [blame]	2517	sqlite3OsLeaveMutex();
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2518	*pId = 0;
				2519	return SQLITE_NOMEM;
				2520	}else{
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2521	*pNew = f;
aswift	108bc32	2006-10-11 17:19:46 +0000	[diff] [blame]	2522	switch(lockingStyle) {
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2523	case afpLockingStyle:
				2524	/* afp locking uses the file path so it needs to be included in
				2525	** the afpLockingContext */
				2526	pNew->pMethod = &sqlite3AFPLockingUnixIoMethod;
				2527	pNew->lockingContext =
				2528	sqlite3ThreadSafeMalloc(sizeof(afpLockingContext));
				2529	((afpLockingContext *)pNew->lockingContext)->filePath =
				2530	sqlite3ThreadSafeMalloc(strlen(zFilename) + 1);
				2531	strcpy(((afpLockingContext *)pNew->lockingContext)->filePath,
				2532	zFilename);
				2533	srandomdev();
				2534	break;
				2535	case flockLockingStyle:
				2536	/* flock locking doesn't need additional lockingContext information */
				2537	pNew->pMethod = &sqlite3FlockLockingUnixIoMethod;
				2538	break;
				2539	case dotlockLockingStyle:
				2540	/* dotlock locking uses the file path so it needs to be included in
				2541	** the dotlockLockingContext */
				2542	pNew->pMethod = &sqlite3DotlockLockingUnixIoMethod;
				2543	pNew->lockingContext = sqlite3ThreadSafeMalloc(
				2544	sizeof(dotlockLockingContext));
				2545	((dotlockLockingContext *)pNew->lockingContext)->lockPath =
				2546	sqlite3ThreadSafeMalloc(strlen(zFilename) + strlen(".lock") + 1);
				2547	sprintf(((dotlockLockingContext *)pNew->lockingContext)->lockPath,
				2548	"%s.lock", zFilename);
				2549	break;
				2550	case posixLockingStyle:
				2551	/* posix locking doesn't need additional lockingContext information */
				2552	pNew->pMethod = &sqlite3UnixIoMethod;
				2553	break;
				2554	case noLockingStyle:
				2555	case unsupportedLockingStyle:
				2556	default:
				2557	pNew->pMethod = &sqlite3NolockLockingUnixIoMethod;
				2558	}
				2559	pId = (OsFile)pNew;
				2560	OpenCounter(+1);
				2561	return SQLITE_OK;
				2562	}
				2563	}
				2564	#else /* SQLITE_ENABLE_LOCKING_STYLE */
				2565	static int allocateUnixFile(
				2566	int h, /* Open file descriptor on file being opened */
				2567	OsFile *pId, / Write the resul unixFile structure here */
				2568	const char zFilename, / Name of the file being opened */
				2569	int delFlag /* If true, delete the file on or before closing */
				2570	){
				2571	unixFile *pNew;
				2572	unixFile f;
				2573	int rc;
				2574
drh	61fc595	2007-04-01 23:49:51 +0000	[diff] [blame^]	2575	memset(&f, 0, sizeof(f));
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2576	sqlite3OsEnterMutex();
				2577	rc = findLockInfo(h, &f.pLock, &f.pOpen);
				2578	sqlite3OsLeaveMutex();
				2579	if( delFlag ){
				2580	unlink(zFilename);
				2581	}
				2582	if( rc ){
				2583	close(h);
				2584	return SQLITE_NOMEM;
				2585	}
drh	4f0c587	2007-03-26 22:05:01 +0000	[diff] [blame]	2586	OSTRACE3("OPEN %-3d %s\n", h, zFilename);
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2587	f.dirfd = -1;
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2588	f.h = h;
				2589	SET_THREADID(&f);
				2590	pNew = sqlite3ThreadSafeMalloc( sizeof(unixFile) );
				2591	if( pNew==0 ){
				2592	close(h);
				2593	sqlite3OsEnterMutex();
				2594	releaseLockInfo(f.pLock);
				2595	releaseOpenCnt(f.pOpen);
				2596	sqlite3OsLeaveMutex();
				2597	*pId = 0;
				2598	return SQLITE_NOMEM;
				2599	}else{
				2600	*pNew = f;
drh	054889e	2005-11-30 03:20:31 +0000	[diff] [blame]	2601	pNew->pMethod = &sqlite3UnixIoMethod;
				2602	pId = (OsFile)pNew;
				2603	OpenCounter(+1);
				2604	return SQLITE_OK;
				2605	}
				2606	}
drh	bfe6631	2006-10-03 17:40:40 +0000	[diff] [blame]	2607	#endif /* SQLITE_ENABLE_LOCKING_STYLE */
drh	9c06c95	2005-11-26 00:25:00 +0000	[diff] [blame]	2608
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	2609	#endif /* SQLITE_OMIT_DISKIO */
/***************************************************************************
** Everything above deals with file I/O.  Everything that follows deals
** with other miscellaneous aspects of the operating system interface
****************************************************************************/
				2614
				2615
drh	761df87	2006-12-21 01:29:22 +0000	[diff] [blame]	2616	#ifndef SQLITE_OMIT_LOAD_EXTENSION
				2617	/*
				2618	** Interfaces for opening a shared library, finding entry points
				2619	** within the shared library, and closing the shared library.
				2620	*/
				2621	#include <dlfcn.h>
				2622	void sqlite3UnixDlopen(const char zFilename){
				2623	return dlopen(zFilename, RTLD_NOW \| RTLD_GLOBAL);
				2624	}
				2625	void sqlite3UnixDlsym(void pHandle, const char *zSymbol){
				2626	return dlsym(pHandle, zSymbol);
				2627	}
				2628	int sqlite3UnixDlclose(void *pHandle){
				2629	return dlclose(pHandle);
				2630	}
				2631	#endif /* SQLITE_OMIT_LOAD_EXTENSION */
				2632
drh	0ccebe7	2005-06-07 22:22:50 +0000	[diff] [blame]	2633	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2634	** Get information to seed the random number generator. The seed
				2635	** is written into the buffer zBuf[256]. The calling function must
				2636	** supply a sufficiently large buffer.
				2637	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2638	int sqlite3UnixRandomSeed(char *zBuf){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2639	/* We have to initialize zBuf to prevent valgrind from reporting
				2640	** errors. The reports issued by valgrind are incorrect - we would
				2641	** prefer that the randomness be increased by making use of the
				2642	** uninitialized space in zBuf - but valgrind errors tend to worry
				2643	** some users. Rather than argue, it seems easier just to initialize
				2644	** the whole array and silence valgrind, even if that means less randomness
				2645	** in the random seed.
				2646	**
				2647	** When testing, initializing zBuf[] to zero is all we do. That means
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	2648	** that we always use the same random number sequence. This makes the
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2649	** tests repeatable.
				2650	*/
				2651	memset(zBuf, 0, 256);
				2652	#if !defined(SQLITE_TEST)
				2653	{
drh	842b864	2005-01-21 17:53:17 +0000	[diff] [blame]	2654	int pid, fd;
				2655	fd = open("/dev/urandom", O_RDONLY);
				2656	if( fd<0 ){
drh	0739723	2006-01-06 14:46:46 +0000	[diff] [blame]	2657	time_t t;
				2658	time(&t);
				2659	memcpy(zBuf, &t, sizeof(t));
drh	842b864	2005-01-21 17:53:17 +0000	[diff] [blame]	2660	pid = getpid();
				2661	memcpy(&zBuf[sizeof(time_t)], &pid, sizeof(pid));
				2662	}else{
				2663	read(fd, zBuf, 256);
				2664	close(fd);
				2665	}
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2666	}
				2667	#endif
				2668	return SQLITE_OK;
				2669	}
				2670
				2671	/*
				2672	** Sleep for a little while. Return the amount of time slept.
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	2673	** The argument is the number of milliseconds we want to sleep.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2674	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2675	int sqlite3UnixSleep(int ms){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2676	#if defined(HAVE_USLEEP) && HAVE_USLEEP
				2677	usleep(ms*1000);
				2678	return ms;
				2679	#else
				2680	sleep((ms+999)/1000);
				2681	return 1000*((ms+999)/1000);
				2682	#endif
				2683	}
				2684
				2685	/*
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2686	** Static variables used for thread synchronization.
				2687	**
				2688	** inMutex the nesting depth of the recursive mutex. The thread
				2689	** holding mutexMain can read this variable at any time.
				2690	** But it must hold mutexAux to change this variable. Other
drh	6a3d670	2006-02-10 13:11:32 +0000	[diff] [blame]	2691	** threads must hold mutexAux to read the variable and can
				2692	** never write.
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2693	**
				2694	** mutexOwner The thread id of the thread holding mutexMain. Same
				2695	** access rules as for inMutex.
				2696	**
drh	6a3d670	2006-02-10 13:11:32 +0000	[diff] [blame]	2697	** mutexOwnerValid True if the value in mutexOwner is valid. The same
				2698	** access rules apply as for inMutex.
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2699	**
				2700	** mutexMain The main mutex. Hold this mutex in order to get exclusive
				2701	** access to SQLite data structures.
				2702	**
				2703	** mutexAux An auxiliary mutex needed to access variables defined above.
				2704	**
drh	6a3d670	2006-02-10 13:11:32 +0000	[diff] [blame]	2705	** Mutexes are always acquired in this order: mutexMain mutexAux. It
				2706	** is not necessary to acquire mutexMain in order to get mutexAux - just
				2707	** do not attempt to acquire them in the reverse order: mutexAux mutexMain.
				2708	** Either get the mutexes with mutexMain first or get mutexAux only.
				2709	**
				2710	** When running on a platform where the three variables inMutex, mutexOwner,
				2711	** and mutexOwnerValid can be set atomically, the mutexAux is not required.
				2712	** On many systems, all three are 32-bit integers and writing to a 32-bit
				2713	** integer is atomic. I think. But there are no guarantees. So it seems
				2714	** safer to protect them using mutexAux.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2715	*/
				2716	static int inMutex = 0;
drh	7906975	2004-05-22 21:30:40 +0000	[diff] [blame]	2717	#ifdef SQLITE_UNIX_THREADS
drh	6a3d670	2006-02-10 13:11:32 +0000	[diff] [blame]	2718	static pthread_t mutexOwner; /* Thread holding mutexMain */
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2719	static int mutexOwnerValid = 0; /* True if mutexOwner is valid */
				2720	static pthread_mutex_t mutexMain = PTHREAD_MUTEX_INITIALIZER; /* The mutex */
				2721	static pthread_mutex_t mutexAux = PTHREAD_MUTEX_INITIALIZER; /* Aux mutex */
drh	7906975	2004-05-22 21:30:40 +0000	[diff] [blame]	2722	#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2723
				2724	/*
				2725	** The following pair of routines implements mutual exclusion for
				2726	** multi-threaded processes. Only a single thread is allowed to
				2727	** execute code that is surrounded by EnterMutex() and LeaveMutex().
				2728	**
				2729	** SQLite uses only a single Mutex. There is not much critical
				2730	** code and what little there is executes quickly and without blocking.
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	2731	**
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	2732	** As of version 3.3.2, this mutex must be recursive.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2733	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2734	void sqlite3UnixEnterMutex(){
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2735	#ifdef SQLITE_UNIX_THREADS
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2736	pthread_mutex_lock(&mutexAux);
				2737	if( !mutexOwnerValid \|\| !pthread_equal(mutexOwner, pthread_self()) ){
				2738	pthread_mutex_unlock(&mutexAux);
				2739	pthread_mutex_lock(&mutexMain);
				2740	assert( inMutex==0 );
				2741	assert( !mutexOwnerValid );
				2742	pthread_mutex_lock(&mutexAux);
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2743	mutexOwner = pthread_self();
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2744	mutexOwnerValid = 1;
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2745	}
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2746	inMutex++;
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2747	pthread_mutex_unlock(&mutexAux);
				2748	#else
drh	e9565a6	2006-02-11 02:03:52 +0000	[diff] [blame]	2749	inMutex++;
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2750	#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2751	}
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2752	void sqlite3UnixLeaveMutex(){
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2753	assert( inMutex>0 );
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2754	#ifdef SQLITE_UNIX_THREADS
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2755	pthread_mutex_lock(&mutexAux);
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2756	inMutex--;
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2757	assert( pthread_equal(mutexOwner, pthread_self()) );
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2758	if( inMutex==0 ){
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2759	assert( mutexOwnerValid );
				2760	mutexOwnerValid = 0;
				2761	pthread_mutex_unlock(&mutexMain);
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2762	}
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2763	pthread_mutex_unlock(&mutexAux);
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2764	#else
				2765	inMutex--;
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2766	#endif
				2767	}
				2768
				2769	/*
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	2770	** Return TRUE if the mutex is currently held.
				2771	**
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2772	** If the thisThrd parameter is true, return true only if the
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	2773	** calling thread holds the mutex. If the parameter is false, return
				2774	** true if any thread holds the mutex.
drh	88f474a	2006-01-02 20:00:12 +0000	[diff] [blame]	2775	*/
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2776	int sqlite3UnixInMutex(int thisThrd){
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2777	#ifdef SQLITE_UNIX_THREADS
drh	5c11123	2006-02-10 04:33:12 +0000	[diff] [blame]	2778	int rc;
				2779	pthread_mutex_lock(&mutexAux);
				2780	rc = inMutex>0 && (thisThrd==0 \|\| pthread_equal(mutexOwner,pthread_self()));
				2781	pthread_mutex_unlock(&mutexAux);
				2782	return rc;
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2783	#else
drh	757b04e	2006-01-18 17:25:45 +0000	[diff] [blame]	2784	return inMutex>0;
drh	a3fad6f	2006-01-18 14:06:37 +0000	[diff] [blame]	2785	#endif
drh	88f474a	2006-01-02 20:00:12 +0000	[diff] [blame]	2786	}
				2787
				2788	/*
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2789	** Remember the number of thread-specific-data blocks allocated.
				2790	** Use this to verify that we are not leaking thread-specific-data.
				2791	** Ticket #1601
				2792	*/
				2793	#ifdef SQLITE_TEST
				2794	int sqlite3_tsd_count = 0;
				2795	# ifdef SQLITE_UNIX_THREADS
				2796	static pthread_mutex_t tsd_counter_mutex = PTHREAD_MUTEX_INITIALIZER;
				2797	# define TSD_COUNTER(N) \
				2798	pthread_mutex_lock(&tsd_counter_mutex); \
				2799	sqlite3_tsd_count += N; \
				2800	pthread_mutex_unlock(&tsd_counter_mutex);
				2801	# else
				2802	# define TSD_COUNTER(N) sqlite3_tsd_count += N
				2803	# endif
				2804	#else
				2805	# define TSD_COUNTER(N) /* no-op */
				2806	#endif
				2807
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2808	/*
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	2809	** If called with allocateFlag>0, then return a pointer to thread
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2810	** specific data for the current thread. Allocate and zero the
drh	f1a221e	2006-01-15 17:27:17 +0000	[diff] [blame]	2811	** thread-specific data if it does not already exist.
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2812	**
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2813	** If called with allocateFlag==0, then check the current thread
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2814	** specific data. Return it if it exists. If it does not exist,
				2815	** then return NULL.
				2816	**
				2817	** If called with allocateFlag<0, check to see if the thread specific
				2818	** data is allocated and is all zero. If it is then deallocate it.
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2819	** Return a pointer to the thread specific data or NULL if it is
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2820	** unallocated or gets deallocated.
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2821	*/
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2822	ThreadData *sqlite3UnixThreadSpecificData(int allocateFlag){
danielk1977	4d5238f	2006-01-27 06:32:00 +0000	[diff] [blame]	2823	static const ThreadData zeroData = {0}; /* Initializer to silence warnings
				2824	** from broken compilers */
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2825	#ifdef SQLITE_UNIX_THREADS
				2826	static pthread_key_t key;
				2827	static int keyInit = 0;
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2828	ThreadData *pTsd;
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2829
				2830	if( !keyInit ){
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2831	sqlite3OsEnterMutex();
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2832	if( !keyInit ){
				2833	int rc;
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2834	rc = pthread_key_create(&key, 0);
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2835	if( rc ){
drh	8c0ca7d	2006-01-07 04:06:54 +0000	[diff] [blame]	2836	sqlite3OsLeaveMutex();
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2837	return 0;
				2838	}
				2839	keyInit = 1;
				2840	}
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2841	sqlite3OsLeaveMutex();
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2842	}
				2843
drh	3fbb0b1	2006-01-06 00:36:00 +0000	[diff] [blame]	2844	pTsd = pthread_getspecific(key);
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2845	if( allocateFlag>0 ){
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2846	if( pTsd==0 ){
danielk1977	76e8d1a	2006-01-18 18:22:43 +0000	[diff] [blame]	2847	if( !sqlite3TestMallocFail() ){
				2848	pTsd = sqlite3OsMalloc(sizeof(zeroData));
				2849	}
				2850	#ifdef SQLITE_MEMDEBUG
				2851	sqlite3_isFail = 0;
				2852	#endif
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2853	if( pTsd ){
				2854	*pTsd = zeroData;
				2855	pthread_setspecific(key, pTsd);
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2856	TSD_COUNTER(+1);
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2857	}
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2858	}
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2859	}else if( pTsd!=0 && allocateFlag<0
danielk1977	9e12800	2006-01-18 16:51:35 +0000	[diff] [blame]	2860	&& memcmp(pTsd, &zeroData, sizeof(ThreadData))==0 ){
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2861	sqlite3OsFree(pTsd);
				2862	pthread_setspecific(key, 0);
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2863	TSD_COUNTER(-1);
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2864	pTsd = 0;
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2865	}
				2866	return pTsd;
				2867	#else
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2868	static ThreadData *pTsd = 0;
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2869	if( allocateFlag>0 ){
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2870	if( pTsd==0 ){
danielk1977	76e8d1a	2006-01-18 18:22:43 +0000	[diff] [blame]	2871	if( !sqlite3TestMallocFail() ){
				2872	pTsd = sqlite3OsMalloc( sizeof(zeroData) );
				2873	}
				2874	#ifdef SQLITE_MEMDEBUG
				2875	sqlite3_isFail = 0;
				2876	#endif
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2877	if( pTsd ){
				2878	*pTsd = zeroData;
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2879	TSD_COUNTER(+1);
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2880	}
drh	3fbb0b1	2006-01-06 00:36:00 +0000	[diff] [blame]	2881	}
drh	70ff98a	2006-01-12 01:25:18 +0000	[diff] [blame]	2882	}else if( pTsd!=0 && allocateFlag<0
danielk1977	9e12800	2006-01-18 16:51:35 +0000	[diff] [blame]	2883	&& memcmp(pTsd, &zeroData, sizeof(ThreadData))==0 ){
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2884	sqlite3OsFree(pTsd);
drh	b4bc705	2006-01-11 23:40:33 +0000	[diff] [blame]	2885	TSD_COUNTER(-1);
drh	6f7adc8	2006-01-11 21:41:20 +0000	[diff] [blame]	2886	pTsd = 0;
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2887	}
drh	3fbb0b1	2006-01-06 00:36:00 +0000	[diff] [blame]	2888	return pTsd;
danielk1977	13a68c3	2005-12-15 10:11:30 +0000	[diff] [blame]	2889	#endif
				2890	}
				2891
				2892	/*
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2893	** The following variable, if set to a non-zero value, becomes the result
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2894	** returned from sqlite3OsCurrentTime(). This is used for testing.
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2895	*/
				2896	#ifdef SQLITE_TEST
				2897	int sqlite3_current_time = 0;
				2898	#endif
				2899
				2900	/*
				2901	** Find the current time (in Universal Coordinated Time). Write the
				2902	** current time and date as a Julian Day number into *prNow and
				2903	** return 0. Return 1 if the time and date cannot be found.
				2904	*/
drh	66560ad	2006-01-06 14:32:19 +0000	[diff] [blame]	2905	int sqlite3UnixCurrentTime(double *prNow){
drh	19e2d37	2005-08-29 23:00:03 +0000	[diff] [blame]	2906	#ifdef NO_GETTOD
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2907	time_t t;
				2908	time(&t);
				2909	*prNow = t/86400.0 + 2440587.5;
drh	19e2d37	2005-08-29 23:00:03 +0000	[diff] [blame]	2910	#else
				2911	struct timeval sNow;
				2912	struct timezone sTz; /* Not used */
				2913	gettimeofday(&sNow, &sTz);
				2914	*prNow = 2440587.5 + sNow.tv_sec/86400.0 + sNow.tv_usec/86400000000.0;
				2915	#endif
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2916	#ifdef SQLITE_TEST
				2917	if( sqlite3_current_time ){
				2918	*prNow = sqlite3_current_time/86400.0 + 2440587.5;
				2919	}
				2920	#endif
				2921	return 0;
				2922	}
				2923
drh	bbd42a6	2004-05-22 17:41:58 +0000	[diff] [blame]	2924	#endif /* OS_UNIX */