Skip to content

Commit

Permalink
Merge pull request #2009 from Expensify/flo_checkpointer
Browse files Browse the repository at this point in the history
Allow passing a different checkpoint mode via CLI arguments
  • Loading branch information
tylerkaraszewski authored Dec 17, 2024
2 parents 5af420e + 3df5fdf commit a74a5d6
Show file tree
Hide file tree
Showing 6 changed files with 46 additions and 13 deletions.
8 changes: 4 additions & 4 deletions BedrockServer.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -97,7 +97,7 @@ void BedrockServer::sync()
// We use fewer FDs on test machines that have other resource restrictions in place.

SINFO("Setting dbPool size to: " << _dbPoolSize);
_dbPool = make_shared<SQLitePool>(_dbPoolSize, args["-db"], args.calc("-cacheSize"), args.calc("-maxJournalSize"), journalTables, mmapSizeGB, args.isSet("-hctree"));
_dbPool = make_shared<SQLitePool>(_dbPoolSize, args["-db"], args.calc("-cacheSize"), args.calc("-maxJournalSize"), journalTables, mmapSizeGB, args.isSet("-hctree"), args["-checkpointMode"]);
SQLite& db = _dbPool->getBase();

// Initialize the command processor.
Expand Down Expand Up @@ -358,7 +358,7 @@ void BedrockServer::sync()
committingCommand = true;
_syncNode->startCommit(SQLiteNode::QUORUM);
_lastQuorumCommandTime = STimeNow();

// This interrupts the next poll loop immediately. This prevents a 1-second wait when running as a single server.
_notifyDoneSync.push(true);
SDEBUG("Finished sending distributed transaction for db upgrade.");
Expand Down Expand Up @@ -1695,14 +1695,14 @@ void BedrockServer::_status(unique_ptr<BedrockCommand>& command) {
size_t totalCount = 0;
for (const auto& s : _crashCommands) {
totalCount += s.second.size();

vector<string> paramsArray;
for (const STable& params : s.second) {
if (!params.empty()) {
paramsArray.push_back(SComposeJSONObject(params));
}
}

STable commandObject;
commandObject[s.first] = SComposeJSONArray(paramsArray);
crashCommandListArray.push_back(SComposeJSONObject(commandObject));
Expand Down
4 changes: 4 additions & 0 deletions main.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -236,6 +236,7 @@ int main(int argc, char* argv[]) {
<< endl;
cout << "-maxJournalSize <#commits> Number of commits to retain in the historical journal (default 1000000)"
<< endl;
cout << "-checkpointMode <mode> Accepts PASSIVE|FULL|RESTART|TRUNCATE, which is the value passed to https://www.sqlite.org/c3ref/wal_checkpoint_v2.html" << endl;
cout << endl;
cout << "Quick Start Tips:" << endl;
cout << "-----------------" << endl;
Expand Down Expand Up @@ -300,6 +301,9 @@ int main(int argc, char* argv[]) {
SETDEFAULT("-queryLog", "queryLog.csv");
SETDEFAULT("-enableMultiWrite", "true");

// We default to PASSIVE checkpoint everywhere as that has been the value proven to work fine for many years.
SETDEFAULT("-checkpointMode", "PASSIVE");

args["-plugins"] = SComposeList(loadPlugins(args));

// Reset the database if requested
Expand Down
34 changes: 29 additions & 5 deletions sqlitecluster/SQLite.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -198,17 +198,24 @@ void SQLite::commonConstructorInitialization(bool hctree) {

// Always set synchronous commits to off for best commit performance in WAL mode.
SASSERT(!SQuery(_db, "setting synchronous commits to off", "PRAGMA synchronous = OFF;"));

// For non-passive checkpoints, we must set a busy timeout in order to wait on any readers.
// We set it to 2 minutes as the majority of transactions should take less than that.
if (_checkpointMode != SQLITE_CHECKPOINT_PASSIVE) {
sqlite3_busy_timeout(_db, 120'000);
}
}

SQLite::SQLite(const string& filename, int cacheSize, int maxJournalSize,
int minJournalTables, int64_t mmapSizeGB, bool hctree) :
int minJournalTables, int64_t mmapSizeGB, bool hctree, const string& checkpointMode) :
_filename(initializeFilename(filename)),
_maxJournalSize(maxJournalSize),
_db(initializeDB(_filename, mmapSizeGB, hctree)),
_journalNames(initializeJournal(_db, minJournalTables)),
_sharedData(initializeSharedData(_db, _filename, _journalNames, hctree)),
_cacheSize(cacheSize),
_mmapSizeGB(mmapSizeGB)
_mmapSizeGB(mmapSizeGB),
_checkpointMode(getCheckpointModeFromString(checkpointMode))
{
commonConstructorInitialization(hctree);
}
Expand All @@ -220,7 +227,8 @@ SQLite::SQLite(const SQLite& from) :
_journalNames(from._journalNames),
_sharedData(from._sharedData),
_cacheSize(from._cacheSize),
_mmapSizeGB(from._mmapSizeGB)
_mmapSizeGB(from._mmapSizeGB),
_checkpointMode(from._checkpointMode)
{
// This can always pass "true" because the copy constructor does not need to set the DB to WAL2 mode, it would have been set in the object being copied.
commonConstructorInitialization(true);
Expand Down Expand Up @@ -801,9 +809,9 @@ int SQLite::commit(const string& description, function<void()>* preCheckpointCal
if (_sharedData.outstandingFramesToCheckpoint) {
auto start = STimeNow();
int framesCheckpointed = 0;
sqlite3_wal_checkpoint_v2(_db, 0, SQLITE_CHECKPOINT_PASSIVE, NULL, &framesCheckpointed);
sqlite3_wal_checkpoint_v2(_db, 0, _checkpointMode, NULL, &framesCheckpointed);
auto end = STimeNow();
SINFO("Checkpointed " << framesCheckpointed << " (total) frames of " << _sharedData.outstandingFramesToCheckpoint << " in " << (end - start) << "us.");
SINFO("Checkpoint with type=" << _checkpointMode << " complete with " << framesCheckpointed << " frames checkpointed of " << _sharedData.outstandingFramesToCheckpoint << " frames outstanding in " << (end - start) << "us.");

// It might not actually be 0, but we'll just let sqlite tell us what it is next time _walHookCallback runs.
_sharedData.outstandingFramesToCheckpoint = 0;
Expand All @@ -828,6 +836,22 @@ int SQLite::commit(const string& description, function<void()>* preCheckpointCal
return result;
}

int SQLite::getCheckpointModeFromString(const string& checkpointModeString) {
if (checkpointModeString == "PASSIVE") {
return SQLITE_CHECKPOINT_PASSIVE;
}
if (checkpointModeString == "FULL") {
return SQLITE_CHECKPOINT_FULL;
}
if (checkpointModeString == "RESTART") {
return SQLITE_CHECKPOINT_RESTART;
}
if (checkpointModeString == "TRUNCATE") {
return SQLITE_CHECKPOINT_TRUNCATE;
}
SERROR("Invalid checkpoint type: " << checkpointModeString);
}

map<uint64_t, tuple<string, string, uint64_t>> SQLite::popCommittedTransactions() {
return _sharedData.popCommittedTransactions();
}
Expand Down
6 changes: 5 additions & 1 deletion sqlitecluster/SQLite.h
Original file line number Diff line number Diff line change
Expand Up @@ -57,7 +57,7 @@ class SQLite {
//
// mmapSizeGB: address space to use for memory-mapped IO, in GB.
SQLite(const string& filename, int cacheSize, int maxJournalSize, int minJournalTables,
int64_t mmapSizeGB = 0, bool hctree = false);
int64_t mmapSizeGB = 0, bool hctree = false, const string& checkpointMode = "PASSIVE");

// This constructor is not exactly a copy constructor. It creates an other SQLite object based on the first except
// with a *different* journal table. This avoids a lot of locking around creating structures that we know already
Expand Down Expand Up @@ -355,6 +355,7 @@ class SQLite {
static sqlite3* initializeDB(const string& filename, int64_t mmapSizeGB, bool hctree);
static vector<string> initializeJournal(sqlite3* db, int minJournalTables);
void commonConstructorInitialization(bool hctree = false);
static int getCheckpointModeFromString(const string& checkpointModeString);

// The filename of this DB, canonicalized to its full path on disk.
const string _filename;
Expand Down Expand Up @@ -527,4 +528,7 @@ class SQLite {

// Set to true inside of a write query.
bool _currentlyWriting{false};

// One of 0|1|2|3 (a.k.a. PASSIVE|FULL|RESTART|TRUNCATE), which is the value to be passed to sqlite3_wal_checkpoint_v2.
int _checkpointMode;
};
5 changes: 3 additions & 2 deletions sqlitecluster/SQLitePool.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,10 @@ SQLitePool::SQLitePool(size_t maxDBs,
int maxJournalSize,
int minJournalTables,
int64_t mmapSizeGB,
bool hctree)
bool hctree,
const string& checkpointMode)
: _maxDBs(max(maxDBs, 1ul)),
_baseDB(filename, cacheSize, maxJournalSize, minJournalTables, mmapSizeGB, hctree),
_baseDB(filename, cacheSize, maxJournalSize, minJournalTables, mmapSizeGB, hctree, checkpointMode),
_objects(_maxDBs, nullptr)
{
}
Expand Down
2 changes: 1 addition & 1 deletion sqlitecluster/SQLitePool.h
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ class SQLitePool {
public:
// Create a pool of DB handles.
SQLitePool(size_t maxDBs, const string& filename, int cacheSize, int maxJournalSize, int minJournalTables,
int64_t mmapSizeGB = 0, bool hctree = false);
int64_t mmapSizeGB = 0, bool hctree = false, const string& checkpointMode = "PASSIVE");
~SQLitePool();

// Get the base object (the first one created, which uses the `journal` table). Note that if called by multiple
Expand Down

0 comments on commit a74a5d6

Please sign in to comment.