nostrdb

an unfairly fast embedded nostr database backed by lmdb
git clone git://jb55.com/nostrdb
Log | Files | Refs | Submodules | README | LICENSE

commit 423598b0f747920369a8625d9aca5298b8e6aa59
parent 6d63a70f95d2c1420185d459b6dd5cea82994af3
Author: William Casarin <jb55@jb55.com>
Date:   Sun, 15 Dec 2024 10:30:01 -0800

migrations: make migrations asyncronous

This also seems to fix some issues with older migrations.

Fixes: https://github.com/damus-io/nostrdb/issues/58

Diffstat:
Msrc/nostrdb.c | 296++++++++++++++++++++++++++++++++++++++-----------------------------------------
Msrc/nostrdb.h | 2+-
Mtest.c | 11+++++++++--
3 files changed, 153 insertions(+), 156 deletions(-)

diff --git a/src/nostrdb.c b/src/nostrdb.c @@ -57,7 +57,7 @@ static const int DEFAULT_QUEUE_SIZE = 32768; #define NDB_PARSED_TAGS (1 << 6) #define NDB_PARSED_ALL (NDB_PARSED_ID|NDB_PARSED_PUBKEY|NDB_PARSED_SIG|NDB_PARSED_CREATED_AT|NDB_PARSED_KIND|NDB_PARSED_CONTENT|NDB_PARSED_TAGS) -typedef int (*ndb_migrate_fn)(struct ndb *); +typedef int (*ndb_migrate_fn)(struct ndb_txn *); typedef int (*ndb_word_parser_fn)(void *, const char *word, int word_len, int word_index); @@ -135,6 +135,7 @@ enum ndb_writer_msgtype { NDB_WRITER_DBMETA, // write ndb metadata NDB_WRITER_PROFILE_LAST_FETCH, // when profiles were last fetched NDB_WRITER_BLOCKS, // write parsed note blocks + NDB_WRITER_MIGRATE, // migrate the database }; // keys used for storing data in the NDB metadata database (NDB_DB_NDB_META) @@ -1589,47 +1590,33 @@ cleanup: // // This was before we had note_profile_pubkey{,_kind} indices. Let's create them. -static int ndb_migrate_profile_indices(struct ndb *ndb) +static int ndb_migrate_profile_indices(struct ndb_txn *txn) { - struct ndb_txn txn; int count; - if (!ndb_begin_rw_query(ndb, &txn)) { - fprintf(stderr, "ndb_migrate_profile_indices: ndb_begin_rw_query failed\n"); - return 0; - } - enum ndb_dbs indices[] = {NDB_DB_NOTE_PUBKEY, NDB_DB_NOTE_PUBKEY_KIND}; - if ((count = ndb_rebuild_note_indices(&txn, indices, 2)) != -1) { + if ((count = ndb_rebuild_note_indices(txn, indices, 2)) != -1) { fprintf(stderr, "migrated %d notes to have pubkey and pubkey_kind indices\n", count); - ndb_end_query(&txn); return 1; } else { fprintf(stderr, "error migrating notes to have pubkey and pubkey_kind indices, aborting.\n"); - mdb_txn_abort(txn.mdb_txn); return 0; } } -static int ndb_migrate_user_search_indices(struct ndb *ndb) +static int ndb_migrate_user_search_indices(struct ndb_txn *txn) { int rc; MDB_cursor *cur; MDB_val k, v; void *profile_root; NdbProfileRecord_table_t record; - struct ndb_txn txn; struct ndb_note *note; uint64_t note_key, profile_key; size_t len; int count; - if (!ndb_begin_rw_query(ndb, &txn)) { - fprintf(stderr, "ndb_migrate_user_search_indices: ndb_begin_rw_query failed\n"); - return 0; - } - - if ((rc = mdb_cursor_open(txn.mdb_txn, ndb->lmdb.dbs[NDB_DB_PROFILE], &cur))) { + if ((rc = mdb_cursor_open(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_PROFILE], &cur))) { fprintf(stderr, "ndb_migrate_user_search_indices: mdb_cursor_open failed, error %d\n", rc); return 0; } @@ -1642,18 +1629,16 @@ static int ndb_migrate_user_search_indices(struct ndb *ndb) profile_key = *((uint64_t*)k.mv_data); record = NdbProfileRecord_as_root(profile_root); note_key = NdbProfileRecord_note_key(record); - note = ndb_get_note_by_key(&txn, note_key, &len); + note = ndb_get_note_by_key(txn, note_key, &len); if (note == NULL) { - fprintf(stderr, "ndb_migrate_user_search_indices: note lookup failed\n"); - return 0; + continue; } - if (!ndb_write_profile_search_indices(&txn, note, profile_key, + if (!ndb_write_profile_search_indices(txn, note, profile_key, profile_root)) { - fprintf(stderr, "ndb_migrate_user_search_indices: ndb_write_profile_search_indices failed\n"); - return 0; + continue; } count++; @@ -1663,51 +1648,33 @@ static int ndb_migrate_user_search_indices(struct ndb *ndb) mdb_cursor_close(cur); - ndb_end_query(&txn); - return 1; } -static int ndb_migrate_lower_user_search_indices(struct ndb *ndb) +static int ndb_migrate_lower_user_search_indices(struct ndb_txn *txn) { - MDB_txn *txn; - - if (mdb_txn_begin(ndb->lmdb.env, NULL, 0, &txn)) { - fprintf(stderr, "ndb_migrate_lower_user_search_indices: ndb_txn_begin failed\n"); - return 0; - } - // just drop the search db so we can rebuild it - if (mdb_drop(txn, ndb->lmdb.dbs[NDB_DB_PROFILE_SEARCH], 0)) { + if (mdb_drop(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_PROFILE_SEARCH], 0)) { fprintf(stderr, "ndb_migrate_lower_user_search_indices: mdb_drop failed\n"); return 0; } - mdb_txn_commit(txn); - - return ndb_migrate_user_search_indices(ndb); + return ndb_migrate_user_search_indices(txn); } int ndb_process_profile_note(struct ndb_note *note, struct ndb_profile_record_builder *profile); -int ndb_db_version(struct ndb *ndb) +int ndb_db_version(struct ndb_txn *txn) { - int rc; uint64_t version, version_key; MDB_val k, v; - MDB_txn *txn; version_key = NDB_META_KEY_VERSION; k.mv_data = &version_key; k.mv_size = sizeof(version_key); - if ((rc = mdb_txn_begin(ndb->lmdb.env, NULL, 0, &txn))) { - fprintf(stderr, "ndb_db_version: mdb_txn_begin failed, error %d\n", rc); - return -1; - } - - if (mdb_get(txn, ndb->lmdb.dbs[NDB_DB_NDB_META], &k, &v)) { + if (mdb_get(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_NDB_META], &k, &v)) { version = -1; } else { if (v.mv_size != 8) { @@ -1717,7 +1684,6 @@ int ndb_db_version(struct ndb *ndb) version = *((uint64_t*)v.mv_data); } - mdb_txn_abort(txn); return version; } @@ -1857,30 +1823,29 @@ static inline int ndb_writer_queue_msg(struct ndb_writer *writer, return prot_queue_push(&writer->inbox, msg); } -static int ndb_migrate_utf8_profile_names(struct ndb *ndb) +static uint64_t ndb_write_note_and_profile(struct ndb_txn *txn, struct ndb_writer_profile *profile, unsigned char *scratch, size_t scratch_size, uint32_t ndb_flags); +static int ndb_migrate_utf8_profile_names(struct ndb_txn *txn) { int rc; MDB_cursor *cur; MDB_val k, v; void *profile_root; NdbProfileRecord_table_t record; - struct ndb_txn txn; struct ndb_note *note, *copied_note; uint64_t note_key; size_t len; - int count, failed; - struct ndb_writer_msg out; + int count, failed, ret; + struct ndb_writer_profile profile; - if (!ndb_begin_rw_query(ndb, &txn)) { - fprintf(stderr, "ndb_migrate_utf8_profile_names: ndb_begin_rw_query failed\n"); - return 0; - } - - if ((rc = mdb_cursor_open(txn.mdb_txn, ndb->lmdb.dbs[NDB_DB_PROFILE], &cur))) { + if ((rc = mdb_cursor_open(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_PROFILE], &cur))) { fprintf(stderr, "ndb_migrate_utf8_profile_names: mdb_cursor_open failed, error %d\n", rc); return 0; } + size_t scratch_size = 8 * 1024 * 1024; + unsigned char *scratch = malloc(scratch_size); + + ret = 1; count = 0; failed = 0; @@ -1889,14 +1854,14 @@ static int ndb_migrate_utf8_profile_names(struct ndb *ndb) profile_root = v.mv_data; record = NdbProfileRecord_as_root(profile_root); note_key = NdbProfileRecord_note_key(record); - note = ndb_get_note_by_key(&txn, note_key, &len); + note = ndb_get_note_by_key(txn, note_key, &len); if (note == NULL) { - fprintf(stderr, "ndb_migrate_utf8_profile_names: note lookup failed\n"); - return 0; + failed++; + continue; } - struct ndb_profile_record_builder *b = &out.profile.record; + struct ndb_profile_record_builder *b = &profile.record; // reprocess profile if (!ndb_process_profile_note(note, b)) { @@ -1908,13 +1873,14 @@ static int ndb_migrate_utf8_profile_names(struct ndb *ndb) copied_note = malloc(len); memcpy(copied_note, note, len); - out.type = NDB_WRITER_PROFILE; - out.profile.note.note = copied_note; - out.profile.note.note_len = len; + profile.note.note = copied_note; + profile.note.note_len = len; - ndb_writer_queue_msg(&ndb->writer, &out); - - count++; + // we don't pass in flags when migrating... a bit sketchy but + // whatever. noone is using this to customize nostrdb atm + if (ndb_write_note_and_profile(txn, &profile, scratch, scratch_size, 0)) { + count++; + } } fprintf(stderr, "migrated %d profiles to fix utf8 profile names\n", count); @@ -1923,11 +1889,10 @@ static int ndb_migrate_utf8_profile_names(struct ndb *ndb) fprintf(stderr, "failed to migrate %d profiles to fix utf8 profile names\n", failed); } + free(scratch); mdb_cursor_close(cur); - ndb_end_query(&txn); - - return 1; + return ret; } static struct ndb_migration MIGRATIONS[] = { @@ -4227,29 +4192,6 @@ static uint64_t ndb_write_note(struct ndb_txn *txn, return note_key; } -// only to be called from the writer thread -static void ndb_write_version(struct ndb_txn *txn, uint64_t version) -{ - int rc; - MDB_val key, val; - uint64_t version_key; - - version_key = NDB_META_KEY_VERSION; - - key.mv_data = &version_key; - key.mv_size = sizeof(version_key); - val.mv_data = &version; - val.mv_size = sizeof(version); - - if ((rc = mdb_put(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_NDB_META], &key, &val, 0))) { - ndb_debug("write version to ndb_meta failed: %s\n", - mdb_strerror(rc)); - return; - } - - //fprintf(stderr, "writing version %" PRIu64 "\n", version); -} - static void ndb_monitor_lock(struct ndb_monitor *mon) { pthread_mutex_lock(&mon->mutex); } @@ -4311,6 +4253,93 @@ static void ndb_notify_subscriptions(struct ndb_monitor *monitor, ndb_monitor_unlock(monitor); } +uint64_t ndb_write_note_and_profile( + struct ndb_txn *txn, + struct ndb_writer_profile *profile, + unsigned char *scratch, + size_t scratch_size, + uint32_t ndb_flags) +{ + uint64_t note_nkey; + + note_nkey = ndb_write_note(txn, &profile->note, scratch, scratch_size, ndb_flags); + + if (profile->record.builder) { + // only write if parsing didn't fail + ndb_write_profile(txn, profile, note_nkey); + } + + return note_nkey; +} + +// only to be called from the writer thread +static int ndb_write_version(struct ndb_txn *txn, uint64_t version) +{ + int rc; + MDB_val key, val; + uint64_t version_key; + + version_key = NDB_META_KEY_VERSION; + + key.mv_data = &version_key; + key.mv_size = sizeof(version_key); + val.mv_data = &version; + val.mv_size = sizeof(version); + + if ((rc = mdb_put(txn->mdb_txn, txn->lmdb->dbs[NDB_DB_NDB_META], &key, &val, 0))) { + ndb_debug("write version to ndb_meta failed: %s\n", + mdb_strerror(rc)); + return 0; + } + + //fprintf(stderr, "writing version %" PRIu64 "\n", version); + return 1; +} + + +static int ndb_run_migrations(struct ndb_txn *txn) +{ + int64_t version, latest_version, i; + + latest_version = sizeof(MIGRATIONS) / sizeof(MIGRATIONS[0]); + + if ((version = ndb_db_version(txn)) == -1) { + ndb_debug("run_migrations: no version found, assuming new db\n"); + version = latest_version; + + // no version found. fresh db? + if (!ndb_write_version(txn, version)) { + fprintf(stderr, "run_migrations: failed writing db version"); + return 0; + } + + return 1; + } else { + ndb_debug("ndb: version %" PRIu64 " found\n", version); + } + + if (version < latest_version) + fprintf(stderr, "nostrdb: migrating v%d -> v%d\n", + (int)version, (int)latest_version); + + for (i = version; i < latest_version; i++) { + if (!MIGRATIONS[i].fn(txn)) { + fprintf(stderr, "run_migrations: migration v%d -> v%d failed\n", (int)i, (int)(i+1)); + return 0; + } + + if (!ndb_write_version(txn, i+1)) { + fprintf(stderr, "run_migrations: failed writing db version"); + return 0; + } + + version = i+1; + } + + return 1; +} + + static void *ndb_writer_thread(void *data) { ndb_debug("started writer thread\n"); @@ -4346,6 +4375,7 @@ static void *ndb_writer_thread(void *data) case NDB_WRITER_DBMETA: needs_commit = 1; break; case NDB_WRITER_PROFILE_LAST_FETCH: needs_commit = 1; break; case NDB_WRITER_BLOCKS: needs_commit = 1; break; + case NDB_WRITER_MIGRATE: needs_commit = 1; break; case NDB_WRITER_QUIT: break; } } @@ -4369,24 +4399,22 @@ static void *ndb_writer_thread(void *data) continue; case NDB_WRITER_PROFILE: note_nkey = - ndb_write_note(&txn, &msg->note, - scratch, scratch_size, - writer->ndb_flags); + ndb_write_note_and_profile( + &txn, + &msg->profile, + scratch, + scratch_size, + writer->ndb_flags); + if (note_nkey > 0) { written_notes[num_notes++] = (struct written_note){ .note_id = note_nkey, - .note = &msg->note, + .note = &msg->profile.note, }; } else { ndb_debug("failed to write note\n"); } - if (msg->profile.record.builder) { - // only write if parsing didn't fail - ndb_write_profile(&txn, &msg->profile, - note_nkey); - } - break; case NDB_WRITER_NOTE: note_nkey = ndb_write_note(&txn, &msg->note, scratch, @@ -4407,6 +4435,12 @@ static void *ndb_writer_thread(void *data) ndb_write_blocks(&txn, msg->blocks.note_key, msg->blocks.blocks); break; + case NDB_WRITER_MIGRATE: + if (!ndb_run_migrations(&txn)) { + mdb_txn_abort(txn.mdb_txn); + goto bail; + } + break; case NDB_WRITER_PROFILE_LAST_FETCH: ndb_writer_last_profile_fetch(&txn, msg->last_fetch.pubkey, @@ -4443,6 +4477,7 @@ static void *ndb_writer_thread(void *data) } } +bail: free(scratch); ndb_debug("quitting writer thread\n"); return NULL; @@ -4753,50 +4788,6 @@ static int ndb_queue_write_version(struct ndb *ndb, uint64_t version) return ndb_writer_queue_msg(&ndb->writer, &msg); } -static int ndb_run_migrations(struct ndb *ndb) -{ - int64_t version, latest_version, i; - - latest_version = sizeof(MIGRATIONS) / sizeof(MIGRATIONS[0]); - - if ((version = ndb_db_version(ndb)) == -1) { - ndb_debug("run_migrations: no version found, assuming new db\n"); - version = latest_version; - - // no version found. fresh db? - if (!ndb_queue_write_version(ndb, version)) { - fprintf(stderr, "run_migrations: failed writing db version"); - return 0; - } - - return 1; - } else { - ndb_debug("ndb: version %" PRIu64 " found\n", version); - } - - if (version < latest_version) - fprintf(stderr, "nostrdb: migrating v%d -> v%d\n", - (int)version, (int)latest_version); - - for (i = version; i < latest_version; i++) { - if (!MIGRATIONS[i].fn(ndb)) { - fprintf(stderr, "run_migrations: migration v%d -> v%d failed\n", (int)i, (int)(i+1)); - return 0; - } - - if (!ndb_queue_write_version(ndb, i+1)) { - fprintf(stderr, "run_migrations: failed writing db version"); - return 0; - } - - version = i+1; - } - - ndb->version = version; - - return 1; -} - static void ndb_monitor_init(struct ndb_monitor *monitor, ndb_sub_fn cb, void *sub_cb_ctx) { @@ -4861,10 +4852,9 @@ int ndb_init(struct ndb **pndb, const char *filename, const struct ndb_config *c return 0; } - if (!ndb_flag_set(config->flags, NDB_FLAG_NOMIGRATE) && - !ndb_run_migrations(ndb)) { - fprintf(stderr, "failed to run migrations\n"); - return 0; + if (!ndb_flag_set(config->flags, NDB_FLAG_NOMIGRATE)) { + struct ndb_writer_msg msg = { .type = NDB_WRITER_MIGRATE }; + ndb_writer_queue_msg(&ndb->writer, &msg); } // Initialize LMDB environment and spin up threads diff --git a/src/nostrdb.h b/src/nostrdb.h @@ -458,7 +458,7 @@ int ndb_note_verify(void *secp_ctx, unsigned char pubkey[32], unsigned char id[3 // NDB int ndb_init(struct ndb **ndb, const char *dbdir, const struct ndb_config *); -int ndb_db_version(struct ndb *ndb); +int ndb_db_version(struct ndb_txn *txn); int ndb_process_event(struct ndb *, const char *json, int len); int ndb_process_events(struct ndb *, const char *ldjson, size_t len); #ifndef _WIN32 diff --git a/test.c b/test.c @@ -470,12 +470,16 @@ static void test_migrate() { static const char *v0_dir = "testdata/db/v0"; struct ndb *ndb; struct ndb_config config; + struct ndb_txn txn; + ndb_default_config(&config); ndb_config_set_flags(&config, NDB_FLAG_NOMIGRATE); fprintf(stderr, "testing migrate on v0\n"); assert(ndb_init(&ndb, v0_dir, &config)); - assert(ndb_db_version(ndb) == 0); + assert(ndb_begin_query(ndb, &txn)); + assert(ndb_db_version(&txn) == 0); + assert(ndb_end_query(&txn)); ndb_destroy(ndb); ndb_config_set_flags(&config, 0); @@ -483,7 +487,10 @@ static void test_migrate() { assert(ndb_init(&ndb, v0_dir, &config)); ndb_destroy(ndb); assert(ndb_init(&ndb, v0_dir, &config)); - assert(ndb_db_version(ndb) == 3); + + assert(ndb_begin_query(ndb, &txn)); + assert(ndb_db_version(&txn) == 3); + assert(ndb_end_query(&txn)); test_profile_search(ndb); ndb_destroy(ndb);