2009-10-20 21:03:30 -07:00
|
|
|
/* database-private.h - For peeking into the internals of notmuch_database_t
|
|
|
|
*
|
|
|
|
* Copyright © 2009 Carl Worth
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
2016-06-02 12:26:14 -04:00
|
|
|
* along with this program. If not, see https://www.gnu.org/licenses/ .
|
2009-10-20 21:03:30 -07:00
|
|
|
*
|
|
|
|
* Author: Carl Worth <cworth@cworth.org>
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef NOTMUCH_DATABASE_PRIVATE_H
|
|
|
|
#define NOTMUCH_DATABASE_PRIVATE_H
|
|
|
|
|
2010-02-09 11:09:30 -08:00
|
|
|
/* According to WG14/N1124, a C++ implementation won't provide us a
|
|
|
|
* macro like PRIx64 (which gives a printf format string for
|
|
|
|
* formatting a uint64_t as hexadecimal) unless we define
|
|
|
|
* __STDC_FORMAT_MACROS before including inttypes.h. That's annoying,
|
|
|
|
* but there it is.
|
|
|
|
*/
|
|
|
|
#define __STDC_FORMAT_MACROS
|
|
|
|
#include <inttypes.h>
|
|
|
|
|
2009-10-20 21:03:30 -07:00
|
|
|
#include "notmuch-private.h"
|
|
|
|
|
2016-10-05 08:34:34 -03:00
|
|
|
#ifdef SILENCE_XAPIAN_DEPRECATION_WARNINGS
|
|
|
|
#define XAPIAN_DEPRECATED(D) D
|
|
|
|
#endif
|
|
|
|
|
2009-10-20 21:03:30 -07:00
|
|
|
#include <xapian.h>
|
|
|
|
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
/* Bit masks for _notmuch_database::features. Features are named,
|
|
|
|
* independent aspects of the database schema.
|
|
|
|
*
|
|
|
|
* A database stores the set of features that it "uses" (implicitly
|
|
|
|
* before database version 3 and explicitly as of version 3).
|
|
|
|
*
|
|
|
|
* A given library version will "recognize" a particular set of
|
|
|
|
* features; if a database uses a feature that the library does not
|
|
|
|
* recognize, the library will refuse to open it. It is assumed the
|
|
|
|
* set of recognized features grows monotonically over time. A
|
|
|
|
* library version will "implement" some subset of the recognized
|
|
|
|
* features: some operations may require that the database use (or not
|
|
|
|
* use) some feature, while other operations may support both
|
|
|
|
* databases that use and that don't use some feature.
|
|
|
|
*
|
|
|
|
* On disk, the database stores string names for these features (see
|
|
|
|
* the feature_names array). These enum bit values are never
|
|
|
|
* persisted to disk and may change freely.
|
|
|
|
*/
|
|
|
|
enum _notmuch_features {
|
|
|
|
/* If set, file names are stored in "file-direntry" terms. If
|
|
|
|
* unset, file names are stored in document data.
|
|
|
|
*
|
|
|
|
* Introduced: version 1. */
|
|
|
|
NOTMUCH_FEATURE_FILE_TERMS = 1 << 0,
|
|
|
|
|
|
|
|
/* If set, directory timestamps are stored in documents with
|
|
|
|
* XDIRECTORY terms and relative paths. If unset, directory
|
|
|
|
* timestamps are stored in documents with XTIMESTAMP terms and
|
|
|
|
* absolute paths.
|
|
|
|
*
|
|
|
|
* Introduced: version 1. */
|
|
|
|
NOTMUCH_FEATURE_DIRECTORY_DOCS = 1 << 1,
|
|
|
|
|
|
|
|
/* If set, the from, subject, and message-id headers are stored in
|
|
|
|
* message document values. If unset, message documents *may*
|
|
|
|
* have these values, but if the value is empty, it must be
|
|
|
|
* retrieved from the message file.
|
|
|
|
*
|
|
|
|
* Introduced: optional in version 1, required as of version 3.
|
|
|
|
*/
|
|
|
|
NOTMUCH_FEATURE_FROM_SUBJECT_ID_VALUES = 1 << 2,
|
|
|
|
|
|
|
|
/* If set, folder terms are boolean and path terms exist. If
|
|
|
|
* unset, folder terms are probabilistic and stemmed and path
|
|
|
|
* terms do not exist.
|
|
|
|
*
|
|
|
|
* Introduced: version 2. */
|
|
|
|
NOTMUCH_FEATURE_BOOL_FOLDER = 1 << 3,
|
2014-10-23 08:30:33 -04:00
|
|
|
|
|
|
|
/* If set, missing messages are stored in ghost mail documents.
|
|
|
|
* If unset, thread IDs of ghost messages are stored as database
|
|
|
|
* metadata instead of in ghost documents.
|
|
|
|
*
|
|
|
|
* Introduced: version 3. */
|
|
|
|
NOTMUCH_FEATURE_GHOSTS = 1 << 4,
|
2015-01-22 17:43:37 -06:00
|
|
|
|
|
|
|
|
|
|
|
/* If set, then the database was created after the introduction of
|
|
|
|
* indexed mime types. If unset, then the database may contain a
|
|
|
|
* mixture of messages with indexed and non-indexed mime types.
|
|
|
|
*
|
|
|
|
* Introduced: version 3. */
|
|
|
|
NOTMUCH_FEATURE_INDEXED_MIMETYPES = 1 << 5,
|
lib: Add per-message last modification tracking
This adds a new document value that stores the revision of the last
modification to message metadata, where the revision number increases
monotonically with each database commit.
An alternative would be to store the wall-clock time of the last
modification of each message. In principle this is simpler and has
the advantage that any process can determine the current timestamp
without support from libnotmuch. However, even assuming a computer's
clock never goes backward and ignoring clock skew in networked
environments, this has a fatal flaw. Xapian uses (optimistic)
snapshot isolation, which means reads can be concurrent with writes.
Given this, consider the following time line with a write and two read
transactions:
write |-X-A--------------|
read 1 |---B---|
read 2 |---|
The write transaction modifies message X and records the wall-clock
time of the modification at A. The writer hangs around for a while
and later commits its change. Read 1 is concurrent with the write, so
it doesn't see the change to X. It does some query and records the
wall-clock time of its results at B. Transaction read 2 later starts
after the write commits and queries for changes since wall-clock time
B (say the reads are performing an incremental backup). Even though
read 1 could not see the change to X, read 2 is told (correctly) that
X has not changed since B, the time of the last read. In fact, X
changed before wall-clock time A, but the change was not visible until
*after* wall-clock time B, so read 2 misses the change to X.
This is tricky to solve in full-blown snapshot isolation, but because
Xapian serializes writes, we can use a simple, monotonically
increasing database revision number. Furthermore, maintaining this
revision number requires no more IO than a wall-clock time solution
because Xapian already maintains statistics on the upper (and lower)
bound of each value stream.
2014-10-13 02:20:01 -04:00
|
|
|
|
|
|
|
/* If set, messages store the revision number of the last
|
|
|
|
* modification in NOTMUCH_VALUE_LAST_MOD.
|
|
|
|
*
|
|
|
|
* Introduced: version 3. */
|
|
|
|
NOTMUCH_FEATURE_LAST_MOD = 1 << 6,
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
};
|
|
|
|
|
|
|
|
/* In C++, a named enum is its own type, so define bitwise operators
|
|
|
|
* on _notmuch_features. */
|
|
|
|
inline _notmuch_features
|
|
|
|
operator|(_notmuch_features a, _notmuch_features b)
|
|
|
|
{
|
|
|
|
return static_cast<_notmuch_features>(
|
|
|
|
static_cast<unsigned>(a) | static_cast<unsigned>(b));
|
|
|
|
}
|
|
|
|
|
|
|
|
inline _notmuch_features
|
|
|
|
operator&(_notmuch_features a, _notmuch_features b)
|
|
|
|
{
|
|
|
|
return static_cast<_notmuch_features>(
|
|
|
|
static_cast<unsigned>(a) & static_cast<unsigned>(b));
|
|
|
|
}
|
|
|
|
|
|
|
|
inline _notmuch_features
|
|
|
|
operator~(_notmuch_features a)
|
|
|
|
{
|
|
|
|
return static_cast<_notmuch_features>(~static_cast<unsigned>(a));
|
|
|
|
}
|
|
|
|
|
|
|
|
inline _notmuch_features&
|
|
|
|
operator|=(_notmuch_features &a, _notmuch_features b)
|
|
|
|
{
|
|
|
|
a = a | b;
|
|
|
|
return a;
|
|
|
|
}
|
|
|
|
|
|
|
|
inline _notmuch_features&
|
|
|
|
operator&=(_notmuch_features &a, _notmuch_features b)
|
|
|
|
{
|
|
|
|
a = a & b;
|
|
|
|
return a;
|
|
|
|
}
|
|
|
|
|
2017-02-16 23:07:49 -04:00
|
|
|
/*
|
|
|
|
* Configuration options for xapian database fields */
|
|
|
|
typedef enum notmuch_field_flags {
|
|
|
|
NOTMUCH_FIELD_NO_FLAGS = 0,
|
|
|
|
NOTMUCH_FIELD_EXTERNAL = 1 << 0,
|
2017-02-26 22:34:19 -04:00
|
|
|
NOTMUCH_FIELD_PROBABILISTIC = 1 << 1,
|
|
|
|
NOTMUCH_FIELD_PROCESSOR = 1 << 2,
|
2017-02-16 23:07:49 -04:00
|
|
|
} notmuch_field_flag_t;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* define bitwise operators to hide casts */
|
|
|
|
inline notmuch_field_flag_t
|
|
|
|
operator|(notmuch_field_flag_t a, notmuch_field_flag_t b)
|
|
|
|
{
|
|
|
|
return static_cast<notmuch_field_flag_t>(
|
|
|
|
static_cast<unsigned>(a) | static_cast<unsigned>(b));
|
|
|
|
}
|
|
|
|
|
|
|
|
inline notmuch_field_flag_t
|
|
|
|
operator&(notmuch_field_flag_t a, notmuch_field_flag_t b)
|
|
|
|
{
|
|
|
|
return static_cast<notmuch_field_flag_t>(
|
|
|
|
static_cast<unsigned>(a) & static_cast<unsigned>(b));
|
|
|
|
}
|
|
|
|
|
2016-03-22 07:54:53 -03:00
|
|
|
#define NOTMUCH_QUERY_PARSER_FLAGS (Xapian::QueryParser::FLAG_BOOLEAN | \
|
|
|
|
Xapian::QueryParser::FLAG_PHRASE | \
|
|
|
|
Xapian::QueryParser::FLAG_LOVEHATE | \
|
|
|
|
Xapian::QueryParser::FLAG_BOOLEAN_ANY_CASE | \
|
|
|
|
Xapian::QueryParser::FLAG_WILDCARD | \
|
|
|
|
Xapian::QueryParser::FLAG_PURE_NOT)
|
|
|
|
|
2009-10-20 21:03:30 -07:00
|
|
|
struct _notmuch_database {
|
2017-10-07 11:44:05 +03:00
|
|
|
bool exception_reported;
|
2010-02-08 11:33:33 -08:00
|
|
|
|
2009-10-20 21:03:30 -07:00
|
|
|
char *path;
|
2010-02-08 11:33:33 -08:00
|
|
|
|
2009-11-21 19:54:25 +00:00
|
|
|
notmuch_database_mode_t mode;
|
2011-06-10 23:35:06 -04:00
|
|
|
int atomic_nesting;
|
2017-10-07 11:44:05 +03:00
|
|
|
/* true if changes have been made in this atomic section */
|
|
|
|
bool atomic_dirty;
|
2009-11-21 19:54:25 +00:00
|
|
|
Xapian::Database *xapian_db;
|
2010-02-08 11:33:33 -08:00
|
|
|
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
/* Bit mask of features used by this database. This is a
|
|
|
|
* bitwise-OR of NOTMUCH_FEATURE_* values (above). */
|
|
|
|
enum _notmuch_features features;
|
|
|
|
|
2010-06-04 10:16:53 -07:00
|
|
|
unsigned int last_doc_id;
|
2010-02-08 11:33:33 -08:00
|
|
|
uint64_t last_thread_id;
|
|
|
|
|
2014-12-26 09:01:01 +01:00
|
|
|
/* error reporting; this value persists only until the
|
|
|
|
* next library call. May be NULL */
|
|
|
|
char *status_string;
|
|
|
|
|
lib: Add per-message last modification tracking
This adds a new document value that stores the revision of the last
modification to message metadata, where the revision number increases
monotonically with each database commit.
An alternative would be to store the wall-clock time of the last
modification of each message. In principle this is simpler and has
the advantage that any process can determine the current timestamp
without support from libnotmuch. However, even assuming a computer's
clock never goes backward and ignoring clock skew in networked
environments, this has a fatal flaw. Xapian uses (optimistic)
snapshot isolation, which means reads can be concurrent with writes.
Given this, consider the following time line with a write and two read
transactions:
write |-X-A--------------|
read 1 |---B---|
read 2 |---|
The write transaction modifies message X and records the wall-clock
time of the modification at A. The writer hangs around for a while
and later commits its change. Read 1 is concurrent with the write, so
it doesn't see the change to X. It does some query and records the
wall-clock time of its results at B. Transaction read 2 later starts
after the write commits and queries for changes since wall-clock time
B (say the reads are performing an incremental backup). Even though
read 1 could not see the change to X, read 2 is told (correctly) that
X has not changed since B, the time of the last read. In fact, X
changed before wall-clock time A, but the change was not visible until
*after* wall-clock time B, so read 2 misses the change to X.
This is tricky to solve in full-blown snapshot isolation, but because
Xapian serializes writes, we can use a simple, monotonically
increasing database revision number. Furthermore, maintaining this
revision number requires no more IO than a wall-clock time solution
because Xapian already maintains statistics on the upper (and lower)
bound of each value stream.
2014-10-13 02:20:01 -04:00
|
|
|
/* Highest committed revision number. Modifications are recorded
|
|
|
|
* under a higher revision number, which can be generated with
|
|
|
|
* notmuch_database_new_revision. */
|
|
|
|
unsigned long revision;
|
2014-10-13 02:20:02 -04:00
|
|
|
const char *uuid;
|
lib: Add per-message last modification tracking
This adds a new document value that stores the revision of the last
modification to message metadata, where the revision number increases
monotonically with each database commit.
An alternative would be to store the wall-clock time of the last
modification of each message. In principle this is simpler and has
the advantage that any process can determine the current timestamp
without support from libnotmuch. However, even assuming a computer's
clock never goes backward and ignoring clock skew in networked
environments, this has a fatal flaw. Xapian uses (optimistic)
snapshot isolation, which means reads can be concurrent with writes.
Given this, consider the following time line with a write and two read
transactions:
write |-X-A--------------|
read 1 |---B---|
read 2 |---|
The write transaction modifies message X and records the wall-clock
time of the modification at A. The writer hangs around for a while
and later commits its change. Read 1 is concurrent with the write, so
it doesn't see the change to X. It does some query and records the
wall-clock time of its results at B. Transaction read 2 later starts
after the write commits and queries for changes since wall-clock time
B (say the reads are performing an incremental backup). Even though
read 1 could not see the change to X, read 2 is told (correctly) that
X has not changed since B, the time of the last read. In fact, X
changed before wall-clock time A, but the change was not visible until
*after* wall-clock time B, so read 2 misses the change to X.
This is tricky to solve in full-blown snapshot isolation, but because
Xapian serializes writes, we can use a simple, monotonically
increasing database revision number. Furthermore, maintaining this
revision number requires no more IO than a wall-clock time solution
because Xapian already maintains statistics on the upper (and lower)
bound of each value stream.
2014-10-13 02:20:01 -04:00
|
|
|
|
2017-02-23 21:38:24 -04:00
|
|
|
/* Keep track of the number of times the database has been re-opened
|
|
|
|
* (or other global invalidations of notmuch's caching)
|
|
|
|
*/
|
|
|
|
unsigned long view;
|
2009-10-21 00:35:56 -07:00
|
|
|
Xapian::QueryParser *query_parser;
|
2009-10-28 10:42:07 -07:00
|
|
|
Xapian::TermGenerator *term_gen;
|
2009-11-23 16:58:35 +01:00
|
|
|
Xapian::ValueRangeProcessor *value_range_processor;
|
lib: add date range query support
Add a custom value range processor to enable date and time searches of
the form date:since..until, where "since" and "until" are expressions
understood by the previously added date/time parser, to restrict the
results to messages within a particular time range (based on the Date:
header).
If "since" or "until" describes date/time at an accuracy of days or
less, the values are rounded according to the accuracy, towards past
for "since" and towards future for "until". For example,
date:november..yesterday would match from the beginning of November
until the end of yesterday. Expressions such as date:today..today
means since the beginning of today until the end of today.
Open-ended ranges are supported (since Xapian 1.2.1), i.e. you can
specify date:..until or date:since.. to not limit the start or end
date, respectively.
CAVEATS:
Xapian does not support spaces in range expressions. You can replace
the spaces with '_', or (in most cases) '-', or (in some cases) leave
the spaces out altogether.
Entering date:expr without ".." (for example date:yesterday) will not
work as you might expect. You can achieve the expected result by
duplicating the expr both sides of ".." (for example
date:yesterday..yesterday).
Open-ended ranges won't work with pre-1.2.1 Xapian, but they don't
produce an error either.
Signed-off-by: Jani Nikula <jani@nikula.org>
2012-10-30 22:32:37 +02:00
|
|
|
Xapian::ValueRangeProcessor *date_range_processor;
|
2014-10-13 02:20:03 -04:00
|
|
|
Xapian::ValueRangeProcessor *last_mod_range_processor;
|
2009-10-20 21:03:30 -07:00
|
|
|
};
|
|
|
|
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
/* Prior to database version 3, features were implied by the database
|
|
|
|
* version number, so hard-code them for earlier versions. */
|
|
|
|
#define NOTMUCH_FEATURES_V0 ((enum _notmuch_features)0)
|
|
|
|
#define NOTMUCH_FEATURES_V1 (NOTMUCH_FEATURES_V0 | NOTMUCH_FEATURE_FILE_TERMS | \
|
|
|
|
NOTMUCH_FEATURE_DIRECTORY_DOCS)
|
|
|
|
#define NOTMUCH_FEATURES_V2 (NOTMUCH_FEATURES_V1 | NOTMUCH_FEATURE_BOOL_FOLDER)
|
|
|
|
|
|
|
|
/* Current database features. If any of these are missing from a
|
|
|
|
* database, request an upgrade.
|
2015-01-22 17:43:37 -06:00
|
|
|
* NOTMUCH_FEATURE_FROM_SUBJECT_ID_VALUES and
|
|
|
|
* NOTMUCH_FEATURE_INDEXED_MIMETYPES are not included because upgrade
|
|
|
|
* doesn't currently introduce the features (though brand new databases
|
|
|
|
* will have it). */
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
#define NOTMUCH_FEATURES_CURRENT \
|
|
|
|
(NOTMUCH_FEATURE_FILE_TERMS | NOTMUCH_FEATURE_DIRECTORY_DOCS | \
|
lib: Add per-message last modification tracking
This adds a new document value that stores the revision of the last
modification to message metadata, where the revision number increases
monotonically with each database commit.
An alternative would be to store the wall-clock time of the last
modification of each message. In principle this is simpler and has
the advantage that any process can determine the current timestamp
without support from libnotmuch. However, even assuming a computer's
clock never goes backward and ignoring clock skew in networked
environments, this has a fatal flaw. Xapian uses (optimistic)
snapshot isolation, which means reads can be concurrent with writes.
Given this, consider the following time line with a write and two read
transactions:
write |-X-A--------------|
read 1 |---B---|
read 2 |---|
The write transaction modifies message X and records the wall-clock
time of the modification at A. The writer hangs around for a while
and later commits its change. Read 1 is concurrent with the write, so
it doesn't see the change to X. It does some query and records the
wall-clock time of its results at B. Transaction read 2 later starts
after the write commits and queries for changes since wall-clock time
B (say the reads are performing an incremental backup). Even though
read 1 could not see the change to X, read 2 is told (correctly) that
X has not changed since B, the time of the last read. In fact, X
changed before wall-clock time A, but the change was not visible until
*after* wall-clock time B, so read 2 misses the change to X.
This is tricky to solve in full-blown snapshot isolation, but because
Xapian serializes writes, we can use a simple, monotonically
increasing database revision number. Furthermore, maintaining this
revision number requires no more IO than a wall-clock time solution
because Xapian already maintains statistics on the upper (and lower)
bound of each value stream.
2014-10-13 02:20:01 -04:00
|
|
|
NOTMUCH_FEATURE_BOOL_FOLDER | NOTMUCH_FEATURE_GHOSTS | \
|
|
|
|
NOTMUCH_FEATURE_LAST_MOD)
|
lib: Database version 3: Introduce fine-grained "features"
Previously, our database schema was versioned by a single number.
Each database schema change had to occur "atomically" in Notmuch's
development history: before some commit, Notmuch used version N, after
that commit, it used version N+1. Hence, each new schema version
could introduce only one change, the task of developing a schema
change fell on a single person, and it all had to happen and be
perfect in a single commit series. This made introducing a new schema
version hard. We've seen only two schema changes in the history of
Notmuch.
This commit introduces database schema version 3; hopefully the last
schema version we'll need for a while. With this version, we switch
from a single version number to "features": a set of named,
independent aspects of the database schema.
Features should make backwards compatibility easier. For many things,
it should be easy to support databases both with and without a
feature, which will allow us to make upgrades optional and will enable
"unstable" features that can be developed and tested over time.
Features also make forwards compatibility easier. The features
recorded in a database include "compatibility flags," which can
indicate to an older version of Notmuch when it must support a given
feature to open the database for read or for write. This lets us
replace the old vague "I don't recognize this version, so something
might go wrong, but I promise to try my best" warnings upon opening a
database with an unknown version with precise errors. If a database
is safe to open for read/write despite unknown features, an older
version will know that and issue no message at all. If the database
is not safe to open for read/write because of unknown features, an
older version will know that, too, and can tell the user exactly which
required features it lacks support for.
2014-08-25 13:26:00 -04:00
|
|
|
|
2010-12-09 00:32:35 -05:00
|
|
|
/* Return the list of terms from the given iterator matching a prefix.
|
|
|
|
* The prefix will be stripped from the strings in the returned list.
|
|
|
|
* The list will be allocated using ctx as the talloc context.
|
2009-11-23 01:10:54 +01:00
|
|
|
*
|
|
|
|
* The function returns NULL on failure.
|
|
|
|
*/
|
2010-12-09 00:32:35 -05:00
|
|
|
notmuch_string_list_t *
|
|
|
|
_notmuch_database_get_terms_with_prefix (void *ctx, Xapian::TermIterator &i,
|
|
|
|
Xapian::TermIterator &end,
|
|
|
|
const char *prefix);
|
2009-11-23 01:10:54 +01:00
|
|
|
|
2017-06-04 09:32:24 -03:00
|
|
|
void
|
|
|
|
_notmuch_database_find_doc_ids (notmuch_database_t *notmuch,
|
|
|
|
const char *prefix_name,
|
|
|
|
const char *value,
|
|
|
|
Xapian::PostingIterator *begin,
|
|
|
|
Xapian::PostingIterator *end);
|
2009-10-20 21:03:30 -07:00
|
|
|
#endif
|