1// Copyright (c) 2012 The Chromium Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5#ifndef SQL_CONNECTION_H_
6#define SQL_CONNECTION_H_
7
8#include <map>
9#include <set>
10#include <string>
11#include <vector>
12
13#include "base/basictypes.h"
14#include "base/callback.h"
15#include "base/compiler_specific.h"
16#include "base/memory/ref_counted.h"
17#include "base/memory/scoped_ptr.h"
18#include "base/threading/thread_restrictions.h"
19#include "base/time/time.h"
20#include "sql/sql_export.h"
21
22struct sqlite3;
23struct sqlite3_stmt;
24
25namespace base {
26class FilePath;
27}
28
29namespace sql {
30
31class Recovery;
32class Statement;
33
34// Uniquely identifies a statement. There are two modes of operation:
35//
36// - In the most common mode, you will use the source file and line number to
37//   identify your statement. This is a convienient way to get uniqueness for
38//   a statement that is only used in one place. Use the SQL_FROM_HERE macro
39//   to generate a StatementID.
40//
41// - In the "custom" mode you may use the statement from different places or
42//   need to manage it yourself for whatever reason. In this case, you should
43//   make up your own unique name and pass it to the StatementID. This name
44//   must be a static string, since this object only deals with pointers and
45//   assumes the underlying string doesn't change or get deleted.
46//
47// This object is copyable and assignable using the compiler-generated
48// operator= and copy constructor.
49class StatementID {
50 public:
51  // Creates a uniquely named statement with the given file ane line number.
52  // Normally you will use SQL_FROM_HERE instead of calling yourself.
53  StatementID(const char* file, int line)
54      : number_(line),
55        str_(file) {
56  }
57
58  // Creates a uniquely named statement with the given user-defined name.
59  explicit StatementID(const char* unique_name)
60      : number_(-1),
61        str_(unique_name) {
62  }
63
64  // This constructor is unimplemented and will generate a linker error if
65  // called. It is intended to try to catch people dynamically generating
66  // a statement name that will be deallocated and will cause a crash later.
67  // All strings must be static and unchanging!
68  explicit StatementID(const std::string& dont_ever_do_this);
69
70  // We need this to insert into our map.
71  bool operator<(const StatementID& other) const;
72
73 private:
74  int number_;
75  const char* str_;
76};
77
78#define SQL_FROM_HERE sql::StatementID(__FILE__, __LINE__)
79
80class Connection;
81
82class SQL_EXPORT Connection {
83 private:
84  class StatementRef;  // Forward declaration, see real one below.
85
86 public:
87  // The database is opened by calling Open[InMemory](). Any uncommitted
88  // transactions will be rolled back when this object is deleted.
89  Connection();
90  ~Connection();
91
92  // Pre-init configuration ----------------------------------------------------
93
94  // Sets the page size that will be used when creating a new database. This
95  // must be called before Init(), and will only have an effect on new
96  // databases.
97  //
98  // From sqlite.org: "The page size must be a power of two greater than or
99  // equal to 512 and less than or equal to SQLITE_MAX_PAGE_SIZE. The maximum
100  // value for SQLITE_MAX_PAGE_SIZE is 32768."
101  void set_page_size(int page_size) { page_size_ = page_size; }
102
103  // Sets the number of pages that will be cached in memory by sqlite. The
104  // total cache size in bytes will be page_size * cache_size. This must be
105  // called before Open() to have an effect.
106  void set_cache_size(int cache_size) { cache_size_ = cache_size; }
107
108  // Call to put the database in exclusive locking mode. There is no "back to
109  // normal" flag because of some additional requirements sqlite puts on this
110  // transaction (requires another access to the DB) and because we don't
111  // actually need it.
112  //
113  // Exclusive mode means that the database is not unlocked at the end of each
114  // transaction, which means there may be less time spent initializing the
115  // next transaction because it doesn't have to re-aquire locks.
116  //
117  // This must be called before Open() to have an effect.
118  void set_exclusive_locking() { exclusive_locking_ = true; }
119
120  // Call to cause Open() to restrict access permissions of the
121  // database file to only the owner.
122  // TODO(shess): Currently only supported on OS_POSIX, is a noop on
123  // other platforms.
124  void set_restrict_to_user() { restrict_to_user_ = true; }
125
126  // Set an error-handling callback.  On errors, the error number (and
127  // statement, if available) will be passed to the callback.
128  //
129  // If no callback is set, the default action is to crash in debug
130  // mode or return failure in release mode.
131  typedef base::Callback<void(int, Statement*)> ErrorCallback;
132  void set_error_callback(const ErrorCallback& callback) {
133    error_callback_ = callback;
134  }
135  bool has_error_callback() const {
136    return !error_callback_.is_null();
137  }
138  void reset_error_callback() {
139    error_callback_.Reset();
140  }
141
142  // Set this tag to enable additional connection-type histogramming
143  // for SQLite error codes and database version numbers.
144  void set_histogram_tag(const std::string& tag) {
145    histogram_tag_ = tag;
146  }
147
148  // Record a sparse UMA histogram sample under
149  // |name|+"."+|histogram_tag_|.  If |histogram_tag_| is empty, no
150  // histogram is recorded.
151  void AddTaggedHistogram(const std::string& name, size_t sample) const;
152
153  // Run "PRAGMA integrity_check" and post each line of
154  // results into |messages|.  Returns the success of running the
155  // statement - per the SQLite documentation, if no errors are found the
156  // call should succeed, and a single value "ok" should be in messages.
157  bool FullIntegrityCheck(std::vector<std::string>* messages);
158
159  // Runs "PRAGMA quick_check" and, unlike the FullIntegrityCheck method,
160  // interprets the results returning true if the the statement executes
161  // without error and results in a single "ok" value.
162  bool QuickIntegrityCheck() WARN_UNUSED_RESULT;
163
164  // Initialization ------------------------------------------------------------
165
166  // Initializes the SQL connection for the given file, returning true if the
167  // file could be opened. You can call this or OpenInMemory.
168  bool Open(const base::FilePath& path) WARN_UNUSED_RESULT;
169
170  // Initializes the SQL connection for a temporary in-memory database. There
171  // will be no associated file on disk, and the initial database will be
172  // empty. You can call this or Open.
173  bool OpenInMemory() WARN_UNUSED_RESULT;
174
175  // Create a temporary on-disk database.  The database will be
176  // deleted after close.  This kind of database is similar to
177  // OpenInMemory() for small databases, but can page to disk if the
178  // database becomes large.
179  bool OpenTemporary() WARN_UNUSED_RESULT;
180
181  // Returns true if the database has been successfully opened.
182  bool is_open() const { return !!db_; }
183
184  // Closes the database. This is automatically performed on destruction for
185  // you, but this allows you to close the database early. You must not call
186  // any other functions after closing it. It is permissable to call Close on
187  // an uninitialized or already-closed database.
188  void Close();
189
190  // Reads the first <cache-size>*<page-size> bytes of the file to prime the
191  // filesystem cache.  This can be more efficient than faulting pages
192  // individually.  Since this involves blocking I/O, it should only be used if
193  // the caller will immediately read a substantial amount of data from the
194  // database.
195  //
196  // TODO(shess): Design a set of histograms or an experiment to inform this
197  // decision.  Preloading should almost always improve later performance
198  // numbers for this database simply because it pulls operations forward, but
199  // if the data isn't actually used soon then preloading just slows down
200  // everything else.
201  void Preload();
202
203  // Try to trim the cache memory used by the database.  If |aggressively| is
204  // true, this function will try to free all of the cache memory it can. If
205  // |aggressively| is false, this function will try to cut cache memory
206  // usage by half.
207  void TrimMemory(bool aggressively);
208
209  // Raze the database to the ground.  This approximates creating a
210  // fresh database from scratch, within the constraints of SQLite's
211  // locking protocol (locks and open handles can make doing this with
212  // filesystem operations problematic).  Returns true if the database
213  // was razed.
214  //
215  // false is returned if the database is locked by some other
216  // process.  RazeWithTimeout() may be used if appropriate.
217  //
218  // NOTE(shess): Raze() will DCHECK in the following situations:
219  // - database is not open.
220  // - the connection has a transaction open.
221  // - a SQLite issue occurs which is structural in nature (like the
222  //   statements used are broken).
223  // Since Raze() is expected to be called in unexpected situations,
224  // these all return false, since it is unlikely that the caller
225  // could fix them.
226  //
227  // The database's page size is taken from |page_size_|.  The
228  // existing database's |auto_vacuum| setting is lost (the
229  // possibility of corruption makes it unreliable to pull it from the
230  // existing database).  To re-enable on the empty database requires
231  // running "PRAGMA auto_vacuum = 1;" then "VACUUM".
232  //
233  // NOTE(shess): For Android, SQLITE_DEFAULT_AUTOVACUUM is set to 1,
234  // so Raze() sets auto_vacuum to 1.
235  //
236  // TODO(shess): Raze() needs a connection so cannot clear SQLITE_NOTADB.
237  // TODO(shess): Bake auto_vacuum into Connection's API so it can
238  // just pick up the default.
239  bool Raze();
240  bool RazeWithTimout(base::TimeDelta timeout);
241
242  // Breaks all outstanding transactions (as initiated by
243  // BeginTransaction()), closes the SQLite database, and poisons the
244  // object so that all future operations against the Connection (or
245  // its Statements) fail safely, without side effects.
246  //
247  // This is intended as an alternative to Close() in error callbacks.
248  // Close() should still be called at some point.
249  void Poison();
250
251  // Raze() the database and Poison() the handle.  Returns the return
252  // value from Raze().
253  // TODO(shess): Rename to RazeAndPoison().
254  bool RazeAndClose();
255
256  // Delete the underlying database files associated with |path|.
257  // This should be used on a database which has no existing
258  // connections.  If any other connections are open to the same
259  // database, this could cause odd results or corruption (for
260  // instance if a hot journal is deleted but the associated database
261  // is not).
262  //
263  // Returns true if the database file and associated journals no
264  // longer exist, false otherwise.  If the database has never
265  // existed, this will return true.
266  static bool Delete(const base::FilePath& path);
267
268  // Transactions --------------------------------------------------------------
269
270  // Transaction management. We maintain a virtual transaction stack to emulate
271  // nested transactions since sqlite can't do nested transactions. The
272  // limitation is you can't roll back a sub transaction: if any transaction
273  // fails, all transactions open will also be rolled back. Any nested
274  // transactions after one has rolled back will return fail for Begin(). If
275  // Begin() fails, you must not call Commit or Rollback().
276  //
277  // Normally you should use sql::Transaction to manage a transaction, which
278  // will scope it to a C++ context.
279  bool BeginTransaction();
280  void RollbackTransaction();
281  bool CommitTransaction();
282
283  // Rollback all outstanding transactions.  Use with care, there may
284  // be scoped transactions on the stack.
285  void RollbackAllTransactions();
286
287  // Returns the current transaction nesting, which will be 0 if there are
288  // no open transactions.
289  int transaction_nesting() const { return transaction_nesting_; }
290
291  // Attached databases---------------------------------------------------------
292
293  // SQLite supports attaching multiple database files to a single
294  // handle.  Attach the database in |other_db_path| to the current
295  // handle under |attachment_point|.  |attachment_point| should only
296  // contain characters from [a-zA-Z0-9_].
297  //
298  // Note that calling attach or detach with an open transaction is an
299  // error.
300  bool AttachDatabase(const base::FilePath& other_db_path,
301                      const char* attachment_point);
302  bool DetachDatabase(const char* attachment_point);
303
304  // Statements ----------------------------------------------------------------
305
306  // Executes the given SQL string, returning true on success. This is
307  // normally used for simple, 1-off statements that don't take any bound
308  // parameters and don't return any data (e.g. CREATE TABLE).
309  //
310  // This will DCHECK if the |sql| contains errors.
311  //
312  // Do not use ignore_result() to ignore all errors.  Use
313  // ExecuteAndReturnErrorCode() and ignore only specific errors.
314  bool Execute(const char* sql) WARN_UNUSED_RESULT;
315
316  // Like Execute(), but returns the error code given by SQLite.
317  int ExecuteAndReturnErrorCode(const char* sql) WARN_UNUSED_RESULT;
318
319  // Returns true if we have a statement with the given identifier already
320  // cached. This is normally not necessary to call, but can be useful if the
321  // caller has to dynamically build up SQL to avoid doing so if it's already
322  // cached.
323  bool HasCachedStatement(const StatementID& id) const;
324
325  // Returns a statement for the given SQL using the statement cache. It can
326  // take a nontrivial amount of work to parse and compile a statement, so
327  // keeping commonly-used ones around for future use is important for
328  // performance.
329  //
330  // If the |sql| has an error, an invalid, inert StatementRef is returned (and
331  // the code will crash in debug). The caller must deal with this eventuality,
332  // either by checking validity of the |sql| before calling, by correctly
333  // handling the return of an inert statement, or both.
334  //
335  // The StatementID and the SQL must always correspond to one-another. The
336  // ID is the lookup into the cache, so crazy things will happen if you use
337  // different SQL with the same ID.
338  //
339  // You will normally use the SQL_FROM_HERE macro to generate a statement
340  // ID associated with the current line of code. This gives uniqueness without
341  // you having to manage unique names. See StatementID above for more.
342  //
343  // Example:
344  //   sql::Statement stmt(connection_.GetCachedStatement(
345  //       SQL_FROM_HERE, "SELECT * FROM foo"));
346  //   if (!stmt)
347  //     return false;  // Error creating statement.
348  scoped_refptr<StatementRef> GetCachedStatement(const StatementID& id,
349                                                 const char* sql);
350
351  // Used to check a |sql| statement for syntactic validity. If the statement is
352  // valid SQL, returns true.
353  bool IsSQLValid(const char* sql);
354
355  // Returns a non-cached statement for the given SQL. Use this for SQL that
356  // is only executed once or only rarely (there is overhead associated with
357  // keeping a statement cached).
358  //
359  // See GetCachedStatement above for examples and error information.
360  scoped_refptr<StatementRef> GetUniqueStatement(const char* sql);
361
362  // Info querying -------------------------------------------------------------
363
364  // Returns true if the given table exists.
365  bool DoesTableExist(const char* table_name) const;
366
367  // Returns true if the given index exists.
368  bool DoesIndexExist(const char* index_name) const;
369
370  // Returns true if a column with the given name exists in the given table.
371  bool DoesColumnExist(const char* table_name, const char* column_name) const;
372
373  // Returns sqlite's internal ID for the last inserted row. Valid only
374  // immediately after an insert.
375  int64 GetLastInsertRowId() const;
376
377  // Returns sqlite's count of the number of rows modified by the last
378  // statement executed. Will be 0 if no statement has executed or the database
379  // is closed.
380  int GetLastChangeCount() const;
381
382  // Errors --------------------------------------------------------------------
383
384  // Returns the error code associated with the last sqlite operation.
385  int GetErrorCode() const;
386
387  // Returns the errno associated with GetErrorCode().  See
388  // SQLITE_LAST_ERRNO in SQLite documentation.
389  int GetLastErrno() const;
390
391  // Returns a pointer to a statically allocated string associated with the
392  // last sqlite operation.
393  const char* GetErrorMessage() const;
394
395  // Return a reproducible representation of the schema equivalent to
396  // running the following statement at a sqlite3 command-line:
397  //   SELECT type, name, tbl_name, sql FROM sqlite_master ORDER BY 1, 2, 3, 4;
398  std::string GetSchema() const;
399
400  // Clients which provide an error_callback don't see the
401  // error-handling at the end of OnSqliteError().  Expose to allow
402  // those clients to work appropriately with ScopedErrorIgnorer in
403  // tests.
404  static bool ShouldIgnoreSqliteError(int error);
405
406 private:
407  // For recovery module.
408  friend class Recovery;
409
410  // Allow test-support code to set/reset error ignorer.
411  friend class ScopedErrorIgnorer;
412
413  // Statement accesses StatementRef which we don't want to expose to everybody
414  // (they should go through Statement).
415  friend class Statement;
416
417  // Internal initialize function used by both Init and InitInMemory. The file
418  // name is always 8 bits since we want to use the 8-bit version of
419  // sqlite3_open. The string can also be sqlite's special ":memory:" string.
420  //
421  // |retry_flag| controls retrying the open if the error callback
422  // addressed errors using RazeAndClose().
423  enum Retry {
424    NO_RETRY = 0,
425    RETRY_ON_POISON
426  };
427  bool OpenInternal(const std::string& file_name, Retry retry_flag);
428
429  // Internal close function used by Close() and RazeAndClose().
430  // |forced| indicates that orderly-shutdown checks should not apply.
431  void CloseInternal(bool forced);
432
433  // Check whether the current thread is allowed to make IO calls, but only
434  // if database wasn't open in memory. Function is inlined to be a no-op in
435  // official build.
436  void AssertIOAllowed() {
437    if (!in_memory_)
438      base::ThreadRestrictions::AssertIOAllowed();
439  }
440
441  // Internal helper for DoesTableExist and DoesIndexExist.
442  bool DoesTableOrIndexExist(const char* name, const char* type) const;
443
444  // Accessors for global error-ignorer, for injecting behavior during tests.
445  // See test/scoped_error_ignorer.h.
446  typedef base::Callback<bool(int)> ErrorIgnorerCallback;
447  static ErrorIgnorerCallback* current_ignorer_cb_;
448  static void SetErrorIgnorer(ErrorIgnorerCallback* ignorer);
449  static void ResetErrorIgnorer();
450
451  // A StatementRef is a refcounted wrapper around a sqlite statement pointer.
452  // Refcounting allows us to give these statements out to sql::Statement
453  // objects while also optionally maintaining a cache of compiled statements
454  // by just keeping a refptr to these objects.
455  //
456  // A statement ref can be valid, in which case it can be used, or invalid to
457  // indicate that the statement hasn't been created yet, has an error, or has
458  // been destroyed.
459  //
460  // The Connection may revoke a StatementRef in some error cases, so callers
461  // should always check validity before using.
462  class SQL_EXPORT StatementRef : public base::RefCounted<StatementRef> {
463   public:
464    // |connection| is the sql::Connection instance associated with
465    // the statement, and is used for tracking outstanding statements
466    // and for error handling.  Set to NULL for invalid or untracked
467    // refs.  |stmt| is the actual statement, and should only be NULL
468    // to create an invalid ref.  |was_valid| indicates whether the
469    // statement should be considered valid for diagnistic purposes.
470    // |was_valid| can be true for NULL |stmt| if the connection has
471    // been forcibly closed by an error handler.
472    StatementRef(Connection* connection, sqlite3_stmt* stmt, bool was_valid);
473
474    // When true, the statement can be used.
475    bool is_valid() const { return !!stmt_; }
476
477    // When true, the statement is either currently valid, or was
478    // previously valid but the connection was forcibly closed.  Used
479    // for diagnostic checks.
480    bool was_valid() const { return was_valid_; }
481
482    // If we've not been linked to a connection, this will be NULL.
483    // TODO(shess): connection_ can be NULL in case of GetUntrackedStatement(),
484    // which prevents Statement::OnError() from forwarding errors.
485    Connection* connection() const { return connection_; }
486
487    // Returns the sqlite statement if any. If the statement is not active,
488    // this will return NULL.
489    sqlite3_stmt* stmt() const { return stmt_; }
490
491    // Destroys the compiled statement and marks it NULL. The statement will
492    // no longer be active.  |forced| is used to indicate if orderly-shutdown
493    // checks should apply (see Connection::RazeAndClose()).
494    void Close(bool forced);
495
496    // Check whether the current thread is allowed to make IO calls, but only
497    // if database wasn't open in memory.
498    void AssertIOAllowed() { if (connection_) connection_->AssertIOAllowed(); }
499
500   private:
501    friend class base::RefCounted<StatementRef>;
502
503    ~StatementRef();
504
505    Connection* connection_;
506    sqlite3_stmt* stmt_;
507    bool was_valid_;
508
509    DISALLOW_COPY_AND_ASSIGN(StatementRef);
510  };
511  friend class StatementRef;
512
513  // Executes a rollback statement, ignoring all transaction state. Used
514  // internally in the transaction management code.
515  void DoRollback();
516
517  // Called by a StatementRef when it's being created or destroyed. See
518  // open_statements_ below.
519  void StatementRefCreated(StatementRef* ref);
520  void StatementRefDeleted(StatementRef* ref);
521
522  // Called when a sqlite function returns an error, which is passed
523  // as |err|.  The return value is the error code to be reflected
524  // back to client code.  |stmt| is non-NULL if the error relates to
525  // an sql::Statement instance.  |sql| is non-NULL if the error
526  // relates to non-statement sql code (Execute, for instance).  Both
527  // can be NULL, but both should never be set.
528  // NOTE(shess): Originally, the return value was intended to allow
529  // error handlers to transparently convert errors into success.
530  // Unfortunately, transactions are not generally restartable, so
531  // this did not work out.
532  int OnSqliteError(int err, Statement* stmt, const char* sql);
533
534  // Like |Execute()|, but retries if the database is locked.
535  bool ExecuteWithTimeout(const char* sql, base::TimeDelta ms_timeout)
536      WARN_UNUSED_RESULT;
537
538  // Internal helper for const functions.  Like GetUniqueStatement(),
539  // except the statement is not entered into open_statements_,
540  // allowing this function to be const.  Open statements can block
541  // closing the database, so only use in cases where the last ref is
542  // released before close could be called (which should always be the
543  // case for const functions).
544  scoped_refptr<StatementRef> GetUntrackedStatement(const char* sql) const;
545
546  bool IntegrityCheckHelper(
547      const char* pragma_sql,
548      std::vector<std::string>* messages) WARN_UNUSED_RESULT;
549
550  // The actual sqlite database. Will be NULL before Init has been called or if
551  // Init resulted in an error.
552  sqlite3* db_;
553
554  // Parameters we'll configure in sqlite before doing anything else. Zero means
555  // use the default value.
556  int page_size_;
557  int cache_size_;
558  bool exclusive_locking_;
559  bool restrict_to_user_;
560
561  // All cached statements. Keeping a reference to these statements means that
562  // they'll remain active.
563  typedef std::map<StatementID, scoped_refptr<StatementRef> >
564      CachedStatementMap;
565  CachedStatementMap statement_cache_;
566
567  // A list of all StatementRefs we've given out. Each ref must register with
568  // us when it's created or destroyed. This allows us to potentially close
569  // any open statements when we encounter an error.
570  typedef std::set<StatementRef*> StatementRefSet;
571  StatementRefSet open_statements_;
572
573  // Number of currently-nested transactions.
574  int transaction_nesting_;
575
576  // True if any of the currently nested transactions have been rolled back.
577  // When we get to the outermost transaction, this will determine if we do
578  // a rollback instead of a commit.
579  bool needs_rollback_;
580
581  // True if database is open with OpenInMemory(), False if database is open
582  // with Open().
583  bool in_memory_;
584
585  // |true| if the connection was closed using RazeAndClose().  Used
586  // to enable diagnostics to distinguish calls to never-opened
587  // databases (incorrect use of the API) from calls to once-valid
588  // databases.
589  bool poisoned_;
590
591  ErrorCallback error_callback_;
592
593  // Tag for auxiliary histograms.
594  std::string histogram_tag_;
595
596  DISALLOW_COPY_AND_ASSIGN(Connection);
597};
598
599}  // namespace sql
600
601#endif  // SQL_CONNECTION_H_
602