xref: /sqlite-3.40.0/src/vacuum.c (revision ee751fab)
1 /*
2 ** 2003 April 6
3 **
4 ** The author disclaims copyright to this source code.  In place of
5 ** a legal notice, here is a blessing:
6 **
7 **    May you do good and not evil.
8 **    May you find forgiveness for yourself and forgive others.
9 **    May you share freely, never taking more than you give.
10 **
11 *************************************************************************
12 ** This file contains code used to implement the VACUUM command.
13 **
14 ** Most of the code in this file may be omitted by defining the
15 ** SQLITE_OMIT_VACUUM macro.
16 */
17 #include "sqliteInt.h"
18 #include "vdbeInt.h"
19 
20 #if !defined(SQLITE_OMIT_VACUUM) && !defined(SQLITE_OMIT_ATTACH)
21 
22 /*
23 ** Execute zSql on database db.
24 **
25 ** If zSql returns rows, then each row will have exactly one
26 ** column.  (This will only happen if zSql begins with "SELECT".)
27 ** Take each row of result and call execSql() again recursively.
28 **
29 ** The execSqlF() routine does the same thing, except it accepts
30 ** a format string as its third argument
31 */
32 static int execSql(sqlite3 *db, char **pzErrMsg, const char *zSql){
33   sqlite3_stmt *pStmt;
34   int rc;
35 
36   /* printf("SQL: [%s]\n", zSql); fflush(stdout); */
37   rc = sqlite3_prepare_v2(db, zSql, -1, &pStmt, 0);
38   if( rc!=SQLITE_OK ) return rc;
39   while( SQLITE_ROW==(rc = sqlite3_step(pStmt)) ){
40     const char *zSubSql = (const char*)sqlite3_column_text(pStmt,0);
41     assert( sqlite3_strnicmp(zSql,"SELECT",6)==0 );
42     /* The secondary SQL must be one of CREATE TABLE, CREATE INDEX,
43     ** or INSERT.  Historically there have been attacks that first
44     ** corrupt the sqlite_master.sql field with other kinds of statements
45     ** then run VACUUM to get those statements to execute at inappropriate
46     ** times. */
47     if( zSubSql
48      && (strncmp(zSubSql,"CRE",3)==0 || strncmp(zSubSql,"INS",3)==0)
49     ){
50       rc = execSql(db, pzErrMsg, zSubSql);
51       if( rc!=SQLITE_OK ) break;
52     }
53   }
54   assert( rc!=SQLITE_ROW );
55   if( rc==SQLITE_DONE ) rc = SQLITE_OK;
56   if( rc ){
57     sqlite3SetString(pzErrMsg, db, sqlite3_errmsg(db));
58   }
59   (void)sqlite3_finalize(pStmt);
60   return rc;
61 }
62 static int execSqlF(sqlite3 *db, char **pzErrMsg, const char *zSql, ...){
63   char *z;
64   va_list ap;
65   int rc;
66   va_start(ap, zSql);
67   z = sqlite3VMPrintf(db, zSql, ap);
68   va_end(ap);
69   if( z==0 ) return SQLITE_NOMEM;
70   rc = execSql(db, pzErrMsg, z);
71   sqlite3DbFree(db, z);
72   return rc;
73 }
74 
75 /*
76 ** The VACUUM command is used to clean up the database,
77 ** collapse free space, etc.  It is modelled after the VACUUM command
78 ** in PostgreSQL.  The VACUUM command works as follows:
79 **
80 **   (1)  Create a new transient database file
81 **   (2)  Copy all content from the database being vacuumed into
82 **        the new transient database file
83 **   (3)  Copy content from the transient database back into the
84 **        original database.
85 **
86 ** The transient database requires temporary disk space approximately
87 ** equal to the size of the original database.  The copy operation of
88 ** step (3) requires additional temporary disk space approximately equal
89 ** to the size of the original database for the rollback journal.
90 ** Hence, temporary disk space that is approximately 2x the size of the
91 ** original database is required.  Every page of the database is written
92 ** approximately 3 times:  Once for step (2) and twice for step (3).
93 ** Two writes per page are required in step (3) because the original
94 ** database content must be written into the rollback journal prior to
95 ** overwriting the database with the vacuumed content.
96 **
97 ** Only 1x temporary space and only 1x writes would be required if
98 ** the copy of step (3) were replaced by deleting the original database
99 ** and renaming the transient database as the original.  But that will
100 ** not work if other processes are attached to the original database.
101 ** And a power loss in between deleting the original and renaming the
102 ** transient would cause the database file to appear to be deleted
103 ** following reboot.
104 */
105 void sqlite3Vacuum(Parse *pParse, Token *pNm, Expr *pInto){
106   Vdbe *v = sqlite3GetVdbe(pParse);
107   int iDb = 0;
108   if( v==0 ) goto build_vacuum_end;
109   if( pNm ){
110 #ifndef SQLITE_BUG_COMPATIBLE_20160819
111     /* Default behavior:  Report an error if the argument to VACUUM is
112     ** not recognized */
113     iDb = sqlite3TwoPartName(pParse, pNm, pNm, &pNm);
114     if( iDb<0 ) goto build_vacuum_end;
115 #else
116     /* When SQLITE_BUG_COMPATIBLE_20160819 is defined, unrecognized arguments
117     ** to VACUUM are silently ignored.  This is a back-out of a bug fix that
118     ** occurred on 2016-08-19 (https://www.sqlite.org/src/info/083f9e6270).
119     ** The buggy behavior is required for binary compatibility with some
120     ** legacy applications. */
121     iDb = sqlite3FindDb(pParse->db, pNm);
122     if( iDb<0 ) iDb = 0;
123 #endif
124   }
125   if( iDb!=1 ){
126     int iIntoReg = 0;
127     if( pInto && sqlite3ResolveSelfReference(pParse,0,0,pInto,0)==0 ){
128       iIntoReg = ++pParse->nMem;
129       sqlite3ExprCode(pParse, pInto, iIntoReg);
130     }
131     sqlite3VdbeAddOp2(v, OP_Vacuum, iDb, iIntoReg);
132     sqlite3VdbeUsesBtree(v, iDb);
133   }
134 build_vacuum_end:
135   sqlite3ExprDelete(pParse->db, pInto);
136   return;
137 }
138 
139 /*
140 ** This routine implements the OP_Vacuum opcode of the VDBE.
**
** The database at index iDb of db->aDb[] is rebuilt into a freshly
** attached database named "vacuum_db":  the schema is recreated there,
** table content is copied with INSERT ... SELECT statements, and the
** sqlite_master rows for views, triggers and rootpage=0 tables are
** copied verbatim.
**
** If pOut is NULL, vacuum_db is attached with an empty file name and its
** content is copied back over the original using sqlite3BtreeCopyFile().
** If pOut is not NULL it must be a TEXT value; that text is used as the
** file name of vacuum_db, the copy-back step is skipped, and the
** original database is left as it was.
**
** Returns SQLITE_OK on success or an error code.  SQLITE_ERROR is
** returned, with a message passed to sqlite3SetString() for *pzErrMsg,
** when:
**
**   *  the connection is not in autocommit mode
**   *  more than one VDBE is active on the connection
**   *  pOut is not NULL and is not TEXT
**   *  pOut names a file that is not empty (or whose size cannot be read)
**
** The first three checks return before any connection state is changed.
** On every later path, db->flags, db->mDbFlags, db->nChange,
** db->nTotalChange and db->mTrace are restored to their entry values,
** db->autoCommit is set to 1 and the vacuum_db Btree is closed.
141 */
142 int sqlite3RunVacuum(
143   char **pzErrMsg,        /* Write error message here */
144   sqlite3 *db,            /* Database connection */
145   int iDb,                /* Which attached DB to vacuum */
146   sqlite3_value *pOut     /* Write results here, if not NULL */
147 ){
148   int rc = SQLITE_OK;     /* Return code from service routines */
149   Btree *pMain;           /* The database being vacuumed */
150   Btree *pTemp;           /* The temporary database we vacuum into */
151   u32 saved_mDbFlags;     /* Saved value of db->mDbFlags */
152   u64 saved_flags;        /* Saved value of db->flags */
153   int saved_nChange;      /* Saved value of db->nChange */
154   int saved_nTotalChange; /* Saved value of db->nTotalChange */
155   u8 saved_mTrace;        /* Saved trace settings */
156   Db *pDb = 0;            /* Database to detach at end of vacuum */
157   int isMemDb;            /* True if vacuuming a :memory: database */
158   int nRes;               /* Bytes of reserved space at the end of each page */
159   int nDb;                /* Number of attached databases */
160   const char *zDbMain;    /* Schema name of database to vacuum */
161   const char *zOut;       /* Name of output file */
162 
      /* Precondition checks.  These return directly, without going through
      ** end_of_vacuum, because no connection state has been modified yet. */
163   if( !db->autoCommit ){
164     sqlite3SetString(pzErrMsg, db, "cannot VACUUM from within a transaction");
165     return SQLITE_ERROR;
166   }
167   if( db->nVdbeActive>1 ){
168     sqlite3SetString(pzErrMsg, db,"cannot VACUUM - SQL statements in progress");
169     return SQLITE_ERROR;
170   }
171   if( pOut ){
172     if( sqlite3_value_type(pOut)!=SQLITE_TEXT ){
173       sqlite3SetString(pzErrMsg, db, "non-text filename");
174       return SQLITE_ERROR;
175     }
176     zOut = (const char*)sqlite3_value_text(pOut);
177   }else{
          /* No output file given: ATTACH is run with an empty file name */
178     zOut = "";
179   }
180 
181   /* Save the current value of the database flags so that it can be
182   ** restored before returning. Then set the writable-schema flag, and
183   ** disable CHECK and foreign key constraints.  */
184   saved_flags = db->flags;
185   saved_mDbFlags = db->mDbFlags;
186   saved_nChange = db->nChange;
187   saved_nTotalChange = db->nTotalChange;
188   saved_mTrace = db->mTrace;
189   db->flags |= SQLITE_WriteSchema | SQLITE_IgnoreChecks;
190   db->mDbFlags |= DBFLAG_PreferBuiltin | DBFLAG_Vacuum;
191   db->flags &= ~(u64)(SQLITE_ForeignKeys | SQLITE_ReverseOrder
192                    | SQLITE_Defensive | SQLITE_CountRows);
193   db->mTrace = 0;
194 
      /* Look up the schema name and Btree of the database being vacuumed.
      ** pMain is assigned before the first "goto end_of_vacuum" so that the
      ** cleanup code can always use it. */
195   zDbMain = db->aDb[iDb].zDbSName;
196   pMain = db->aDb[iDb].pBt;
197   isMemDb = sqlite3PagerIsMemdb(sqlite3BtreePager(pMain));
198 
199   /* Attach the temporary database as 'vacuum_db'. The synchronous pragma
200   ** can be set to 'off' for this file, as it is not recovered if a crash
201   ** occurs anyway. The integrity of the database is maintained by a
202   ** (possibly synchronous) transaction opened on the main database before
203   ** sqlite3BtreeCopyFile() is called.
204   **
205   ** An optimisation would be to use a non-journaled pager.
206   ** (Later:) I tried setting "PRAGMA vacuum_db.journal_mode=OFF" but
207   ** that actually made the VACUUM run slower.  Very little journalling
208   ** actually occurs when doing a vacuum since the vacuum_db is initially
209   ** empty.  Only the journal header is written.  Apparently it takes more
210   ** time to parse and run the PRAGMA to turn journalling off than it does
211   ** to write the journal header file.
212   */
213   nDb = db->nDb;   /* Index that the newly attached database will occupy */
214   rc = execSqlF(db, pzErrMsg, "ATTACH %Q AS vacuum_db", zOut);
215   if( rc!=SQLITE_OK ) goto end_of_vacuum;
216   assert( (db->nDb-1)==nDb );
217   pDb = &db->aDb[nDb];
218   assert( strcmp(pDb->zDbSName,"vacuum_db")==0 );
219   pTemp = pDb->pBt;
220   if( pOut ){
          /* An explicit output file must be empty.  The check is skipped
          ** when id->pMethods is NULL.
          ** NOTE(review): presumably pMethods==0 means the file has not
          ** been opened yet -- confirm against the pager/OS layer. */
221     sqlite3_file *id = sqlite3PagerFile(sqlite3BtreePager(pTemp));
222     i64 sz = 0;
223     if( id->pMethods!=0 && (sqlite3OsFileSize(id, &sz)!=SQLITE_OK || sz>0) ){
224       rc = SQLITE_ERROR;
225       sqlite3SetString(pzErrMsg, db, "output file already exists");
226       goto end_of_vacuum;
227     }
228   }
229   nRes = sqlite3BtreeGetOptimalReserve(pMain);
230 
231   /* A VACUUM cannot change the pagesize of an encrypted database. */
232 #ifdef SQLITE_HAS_CODEC
233   if( db->nextPagesize ){
234     extern void sqlite3CodecGetKey(sqlite3*, int, void**, int*);
235     int nKey;
236     char *zKey;
237     sqlite3CodecGetKey(db, iDb, (void**)&zKey, &nKey);
238     if( nKey ) db->nextPagesize = 0;
239   }
240 #endif
241 
      /* Give vacuum_db the cache size of the schema being vacuumed and the
      ** value returned by sqlite3BtreeSetSpillSize(pMain,0), then set its
      ** pager flags to PAGER_SYNCHRONOUS_OFF|PAGER_CACHESPILL.
      ** NOTE(review): SetSpillSize(pMain,0) is presumably a pure query of
      ** the current spill size -- confirm. */
242   sqlite3BtreeSetCacheSize(pTemp, db->aDb[iDb].pSchema->cache_size);
243   sqlite3BtreeSetSpillSize(pTemp, sqlite3BtreeSetSpillSize(pMain,0));
244   sqlite3BtreeSetPagerFlags(pTemp, PAGER_SYNCHRONOUS_OFF|PAGER_CACHESPILL);
245 
246   /* Begin a transaction and take an exclusive lock on the main database
247   ** file. This is done before the sqlite3BtreeGetPageSize(pMain) call below,
248   ** to ensure that we do not try to change the page-size on a WAL database.
      **
      ** NOTE(review): the second argument to sqlite3BtreeBeginTrans() is 2
      ** when vacuuming in place and 0 when pOut is given; presumably 2 asks
      ** for an exclusive write transaction and 0 for a read transaction --
      ** confirm against sqlite3BtreeBeginTrans().
249   */
250   rc = execSql(db, pzErrMsg, "BEGIN");
251   if( rc!=SQLITE_OK ) goto end_of_vacuum;
252   rc = sqlite3BtreeBeginTrans(pMain, pOut==0 ? 2 : 0, 0);
253   if( rc!=SQLITE_OK ) goto end_of_vacuum;
254 
255   /* Do not attempt to change the page size for a WAL database */
256   if( sqlite3PagerGetJournalMode(sqlite3BtreePager(pMain))
257                                                ==PAGER_JOURNALMODE_WAL ){
258     db->nextPagesize = 0;
259   }
260 
      /* Set the page size of vacuum_db to that of the main database and
      ** then, unless the main database is in-memory, to db->nextPagesize.
      ** Any failure here is reported as SQLITE_NOMEM. */
261   if( sqlite3BtreeSetPageSize(pTemp, sqlite3BtreeGetPageSize(pMain), nRes, 0)
262    || (!isMemDb && sqlite3BtreeSetPageSize(pTemp, db->nextPagesize, nRes, 0))
263    || NEVER(db->mallocFailed)
264   ){
265     rc = SQLITE_NOMEM_BKPT;
266     goto end_of_vacuum;
267   }
268 
269 #ifndef SQLITE_OMIT_AUTOVACUUM
      /* Use db->nextAutovac if it is non-negative, otherwise keep the
      ** auto-vacuum setting of the main database. */
270   sqlite3BtreeSetAutoVacuum(pTemp, db->nextAutovac>=0 ? db->nextAutovac :
271                                            sqlite3BtreeGetAutoVacuum(pMain));
272 #endif
273 
274   /* Query the schema of the main database. Create a mirror schema
275   ** in the temporary database.
      **
      ** Each SELECT below returns CREATE statements that execSql() runs as
      ** secondary SQL:  first the tables (except sqlite_sequence and rows
      ** with rootpage<=0), then the indexes.
276   */
277   db->init.iDb = nDb; /* force new CREATE statements into vacuum_db */
278   rc = execSqlF(db, pzErrMsg,
279       "SELECT sql FROM \"%w\".sqlite_master"
280       " WHERE type='table'AND name<>'sqlite_sequence'"
281       " AND coalesce(rootpage,1)>0",
282       zDbMain
283   );
284   if( rc!=SQLITE_OK ) goto end_of_vacuum;
285   rc = execSqlF(db, pzErrMsg,
286       "SELECT sql FROM \"%w\".sqlite_master"
287       " WHERE type='index'",
288       zDbMain
289   );
290   if( rc!=SQLITE_OK ) goto end_of_vacuum;
291   db->init.iDb = 0;
292 
293   /* Loop through the tables in the main database. For each, do
294   ** an "INSERT INTO vacuum_db.xxx SELECT * FROM main.xxx;" to copy
295   ** the contents to the temporary database.
296   */
297   rc = execSqlF(db, pzErrMsg,
298       "SELECT'INSERT INTO vacuum_db.'||quote(name)"
299       "||' SELECT*FROM\"%w\".'||quote(name)"
300       "FROM vacuum_db.sqlite_master "
301       "WHERE type='table'AND coalesce(rootpage,1)>0",
302       zDbMain
303   );
      /* DBFLAG_Vacuum is cleared once the content copy has run, whether or
      ** not it succeeded; rc is only examined afterwards. */
304   assert( (db->mDbFlags & DBFLAG_Vacuum)!=0 );
305   db->mDbFlags &= ~DBFLAG_Vacuum;
306   if( rc!=SQLITE_OK ) goto end_of_vacuum;
307 
308   /* Copy the triggers, views, and virtual tables from the main database
309   ** over to the temporary database.  None of these objects has any
310   ** associated storage, so all we have to do is copy their entries
311   ** from the SQLITE_MASTER table.
312   */
313   rc = execSqlF(db, pzErrMsg,
314       "INSERT INTO vacuum_db.sqlite_master"
315       " SELECT*FROM \"%w\".sqlite_master"
316       " WHERE type IN('view','trigger')"
317       " OR(type='table'AND rootpage=0)",
318       zDbMain
319   );
320   if( rc ) goto end_of_vacuum;
321 
322   /* At this point, there is a write transaction open on both the
323   ** vacuum database and the main database. Assuming no error occurs,
324   ** both transactions are closed by this block - the main database
325   ** transaction by sqlite3BtreeCopyFile() and the other by an explicit
326   ** call to sqlite3BtreeCommit().
      **
      ** When pOut is not NULL the copy-back is skipped, so only the
      ** vacuum database is committed here.
327   */
328   {
329     u32 meta;
330     int i;
331 
332     /* This array determines which meta values are preserved in the
333     ** vacuum.  Even entries are the meta value number and odd entries
334     ** are an increment to apply to the meta value after the vacuum.
335     ** The increment is used to increase the schema cookie so that other
336     ** connections to the same database will know to reread the schema.
337     */
338     static const unsigned char aCopy[] = {
339        BTREE_SCHEMA_VERSION,     1,  /* Add one to the old schema cookie */
340        BTREE_DEFAULT_CACHE_SIZE, 0,  /* Preserve the default page cache size */
341        BTREE_TEXT_ENCODING,      0,  /* Preserve the text encoding */
342        BTREE_USER_VERSION,       0,  /* Preserve the user version */
343        BTREE_APPLICATION_ID,     0,  /* Preserve the application id */
344     };
345 
346     assert( 1==sqlite3BtreeIsInTrans(pTemp) );
347     assert( pOut!=0 || 1==sqlite3BtreeIsInTrans(pMain) );
348 
349     /* Copy Btree meta values */
350     for(i=0; i<ArraySize(aCopy); i+=2){
351       /* GetMeta() and UpdateMeta() cannot fail in this context because
352       ** we already have page 1 loaded into cache and marked dirty. */
353       sqlite3BtreeGetMeta(pMain, aCopy[i], &meta);
354       rc = sqlite3BtreeUpdateMeta(pTemp, aCopy[i], meta+aCopy[i+1]);
355       if( NEVER(rc!=SQLITE_OK) ) goto end_of_vacuum;
356     }
357 
          /* In-place vacuum only: overwrite the original with vacuum_db */
358     if( pOut==0 ){
359       rc = sqlite3BtreeCopyFile(pMain, pTemp);
360     }
361     if( rc!=SQLITE_OK ) goto end_of_vacuum;
362     rc = sqlite3BtreeCommit(pTemp);
363     if( rc!=SQLITE_OK ) goto end_of_vacuum;
364 #ifndef SQLITE_OMIT_AUTOVACUUM
365     if( pOut==0 ){
            /* Carry the auto-vacuum setting of vacuum_db back to the main db */
366       sqlite3BtreeSetAutoVacuum(pMain, sqlite3BtreeGetAutoVacuum(pTemp));
367     }
368 #endif
369   }
370 
371   assert( rc==SQLITE_OK );
372   if( pOut==0 ){
          /* In-place vacuum only: give the main database the page size that
          ** was used for vacuum_db. */
373     rc = sqlite3BtreeSetPageSize(pMain, sqlite3BtreeGetPageSize(pTemp), nRes,1);
374   }
375 
376 end_of_vacuum:
377   /* Restore the connection state that was saved near the top of this
      ** routine.  This label is reached on success and on every error
      ** detected after that state was saved. */
378   db->init.iDb = 0;
379   db->mDbFlags = saved_mDbFlags;
380   db->flags = saved_flags;
381   db->nChange = saved_nChange;
382   db->nTotalChange = saved_nTotalChange;
383   db->mTrace = saved_mTrace;
      /* NOTE(review): the -1 arguments presumably leave the page size and
      ** reserved-byte count unchanged, so that only the final flag takes
      ** effect -- confirm against sqlite3BtreeSetPageSize(). */
384   sqlite3BtreeSetPageSize(pMain, -1, -1, 1);
385 
386   /* Currently there is an SQL level transaction open on the vacuum
387   ** database. No locks are held on any other files (since the main file
388   ** was committed at the btree level). So it is safe to end the transaction
389   ** by manually setting the autoCommit flag to true and detaching the
390   ** vacuum database. The vacuum_db journal file is deleted when the pager
391   ** is closed by the DETACH.
392   */
393   db->autoCommit = 1;
394 
      /* pDb is still NULL if the ATTACH above failed, in which case there
      ** is no vacuum_db Btree to close. */
395   if( pDb ){
396     sqlite3BtreeClose(pDb->pBt);
397     pDb->pBt = 0;
398     pDb->pSchema = 0;
399   }
400 
401   /* This both clears the schemas and reduces the size of the db->aDb[]
402   ** array. */
403   sqlite3ResetAllSchemasOfConnection(db);
404 
405   return rc;
406 }
407 
408 #endif  /* !SQLITE_OMIT_VACUUM && !SQLITE_OMIT_ATTACH */
409