diff --git a/ci/scripts/run-tests-linux.sh b/ci/scripts/run-tests-linux.sh index 6da582f66..048fd503b 100755 --- a/ci/scripts/run-tests-linux.sh +++ b/ci/scripts/run-tests-linux.sh @@ -48,8 +48,11 @@ function run_db_tests(){ cd $WORKDIR/build && \ make test && \ make test-client && \ - run_pgvector_tests && \ - killall postgres && \ + run_pgvector_tests + pg_pid=$(fuser -a 5432/tcp 2>/dev/null | awk "{print $1}" | awk '{$1=$1};1') + if [[ ! -z "$pg_pid" ]]; then + kill -9 $pg_pid + fi gcovr -r $WORKDIR/src/ --object-directory $WORKDIR/build/ --xml /tmp/coverage.xml fi } diff --git a/src/hnsw/build.c b/src/hnsw/build.c index 6b5c554c4..ebc0a8c99 100644 --- a/src/hnsw/build.c +++ b/src/hnsw/build.c @@ -358,7 +358,7 @@ static void InitBuildState(HnswBuildState *buildstate, Relation heap, Relation i buildstate->index_file_path = ldb_HnswGetIndexFilePath(index); // If a dimension wasn't specified try to infer it - if(buildstate->dimensions < 1) { + if(heap != NULL && buildstate->dimensions < 1) { buildstate->dimensions = InferDimension(heap, indexInfo); } /* Require column to have dimensions to be indexed */ @@ -416,10 +416,9 @@ static void ScanTable(HnswBuildState *buildstate) } /* - * Build the index + * Build the index, writing to the main fork */ -static void BuildIndex( - Relation heap, Relation index, IndexInfo *indexInfo, HnswBuildState *buildstate, ForkNumber forkNum) +static void BuildIndex(Relation heap, Relation index, IndexInfo *indexInfo, HnswBuildState *buildstate) { usearch_error_t error = NULL; usearch_init_options_t opts; @@ -543,7 +542,7 @@ static void BuildIndex( //****************************** saving to WAL BEGIN ******************************// UpdateProgress(PROGRESS_CREATEIDX_PHASE, PROGRESS_HNSW_PHASE_LOAD); - StoreExternalIndex(index, &metadata, forkNum, result_buf, &opts, num_added_vectors); + StoreExternalIndex(index, &metadata, MAIN_FORKNUM, result_buf, &opts, num_added_vectors); //****************************** saving to WAL END ******************************// munmap_ret = munmap(result_buf, index_file_stat.st_size); @@ -560,6 +559,38 @@ static void BuildIndex( FreeBuildState(buildstate); } +/* + * Build an empty index, writing to the init fork + */ +static void BuildEmptyIndex(Relation index, IndexInfo *indexInfo, HnswBuildState *buildstate) +{ + usearch_error_t error = NULL; + usearch_init_options_t opts; + MemSet(&opts, 0, sizeof(opts)); + + InitBuildState(buildstate, NULL, index, indexInfo); + opts.dimensions = buildstate->dimensions; + PopulateUsearchOpts(index, &opts); + + buildstate->usearch_index = usearch_init(&opts, &error); + assert(error == NULL); + + buildstate->hnsw = NULL; + + char *result_buf = NULL; + usearch_save(buildstate->usearch_index, NULL, &result_buf, &error); + assert(error == NULL && result_buf != NULL); + + StoreExternalEmptyIndex(index, INIT_FORKNUM, result_buf, &opts); + + usearch_free(buildstate->usearch_index, &error); + free(result_buf); + assert(error == NULL); + buildstate->usearch_index = NULL; + + FreeBuildState(buildstate); +} + /* * Build the index for a logged table */ @@ -568,7 +599,7 @@ IndexBuildResult *ldb_ambuild(Relation heap, Relation index, IndexInfo *indexInf IndexBuildResult *result; HnswBuildState buildstate; - BuildIndex(heap, index, indexInfo, &buildstate, MAIN_FORKNUM); + BuildIndex(heap, index, indexInfo, &buildstate); result = (IndexBuildResult *)palloc(sizeof(IndexBuildResult)); result->heap_tuples = buildstate.reltuples; @@ -578,13 +609,13 @@ IndexBuildResult *ldb_ambuild(Relation heap, Relation index, IndexInfo *indexInf } /* - * Build the index for an unlogged table + * Build an empty index for an unlogged table */ void ldb_ambuildunlogged(Relation index) { - LDB_UNUSED(index); - // todo:: - elog(ERROR, "hnsw index on unlogged tables is currently not supported"); + HnswBuildState buildstate; + IndexInfo *indexInfo = BuildIndexInfo(index); + BuildEmptyIndex(index, indexInfo, &buildstate); } void ldb_reindex_external_index(Oid indrelid) diff --git a/src/hnsw/external_index.c b/src/hnsw/external_index.c index 85613b8d2..dc0317ac8 100644 --- a/src/hnsw/external_index.c +++ b/src/hnsw/external_index.c @@ -8,6 +8,7 @@ #include #include #include +#include // START_CRIT_SECTION, END_CRIT_SECTION #include // BLCKSZ #include // Buffer #include @@ -119,11 +120,13 @@ static void UpdateHeaderBlockMapGroupDesc( hdr_copy->blockmap_groups[ groupno ] = *desc; log_rec_ptr = GenericXLogFinish(state); - assert(log_rec_ptr != InvalidXLogRecPtr); - if(flush_log) { - LDB_FAILURE_POINT_CRASH_IF_ENABLED("just_before_wal_flush"); - XLogFlush(log_rec_ptr); - LDB_FAILURE_POINT_CRASH_IF_ENABLED("just_after_wal_flush"); + if(RelationNeedsWAL(index)) { + assert(log_rec_ptr != InvalidXLogRecPtr); + if(flush_log) { + LDB_FAILURE_POINT_CRASH_IF_ENABLED("just_before_wal_flush"); + XLogFlush(log_rec_ptr); + LDB_FAILURE_POINT_CRASH_IF_ENABLED("just_after_wal_flush"); + } } ReleaseBuffer(hdr_buf); } @@ -417,7 +420,9 @@ void StoreExternalIndexBlockMapGroup(Relation index, // When the blockmap page group was created, header block was updated accordingly in // ContinueBlockMapGroupInitialization call above. const BlockNumber blockmapno = blockmap_id + headerp->blockmap_groups[ blockmap_groupno ].first_block; - Buffer buf = ReadBufferExtended(index, MAIN_FORKNUM, blockmapno, RBM_NORMAL, NULL); + // todo:: should MAIN_FORKNUM be hardcoded here or use the forkNum parameter, from a code readability standpoint + // (other places in this file as well) + Buffer buf = ReadBufferExtended(index, MAIN_FORKNUM, blockmapno, RBM_NORMAL, NULL); LockBuffer(buf, BUFFER_LOCK_EXCLUSIVE); GenericXLogState *state = GenericXLogStart(index); @@ -433,6 +438,68 @@ void StoreExternalIndexBlockMapGroup(Relation index, } } +void StoreExternalEmptyIndex(Relation index, ForkNumber forkNum, char *data, usearch_init_options_t *opts) +{ + // this method is intended to store empty indexes for unlogged tables (ambuildempty method) and should hence be + // called with forkNum = INIT_FORKNUM + + Buffer header_buf = ReadBufferExtended(index, forkNum, P_NEW, RBM_NORMAL, NULL); + + // even when we are creating a new page, it must always be the first page we create + // and should therefore have BlockNumber 0 + assert(BufferGetBlockNumber(header_buf) == 0); + + LockBuffer(header_buf, BUFFER_LOCK_EXCLUSIVE); + + START_CRIT_SECTION(); + + Page header_page = BufferGetPage(header_buf); + + PageInit(header_page, BufferGetPageSize(header_buf), 0); + + HnswIndexHeaderPage *headerp = (HnswIndexHeaderPage *)PageGetContents(header_page); + + headerp->magicNumber = LDB_WAL_MAGIC_NUMBER; + headerp->version = LDB_WAL_VERSION_NUMBER; + headerp->vector_dim = opts->dimensions; + headerp->m = opts->connectivity; + headerp->ef_construction = opts->expansion_add; + headerp->ef = opts->expansion_search; + headerp->metric_kind = opts->metric_kind; + + headerp->num_vectors = 0; + headerp->blockmap_groups_nr = 0; + + for(uint32 i = 0; i < lengthof(headerp->blockmap_groups); ++i) { + headerp->blockmap_groups[ i ] = (HnswBlockMapGroupDesc){ + .first_block = InvalidBlockNumber, + .blockmaps_initialized = 0, + }; + } + + headerp->last_data_block = InvalidBlockNumber; + + memcpy(headerp->usearch_header, data, USEARCH_HEADER_SIZE); + ((PageHeader)header_page)->pd_lower = ((char *)headerp + sizeof(HnswIndexHeaderPage)) - (char *)header_page; + + MarkBufferDirty(header_buf); + + // Write a WAL record containing a full image of the page. Even though this is an unlogged table that doesn't use + // WAL, this line appears to flush changes to disc immediately (and not waiting after the first checkpoint). This is + // important because this empty index will live in the init fork, where it will be used to reset the unlogged index + // after a crash, and so we need this written to disc in order to have proper crash recovery functionality available + // immediately. Otherwise, if a crash occurs before the first postgres checkpoint, postgres can't read the init fork + // from disc and we will have a corrupted index when postgres attempts recovery. This is also what nbtree access + // method's implementation does for empty unlogged indexes (ambuildempty implementation). + // NOTE: we MUST have this be inside a crit section, or else an assertion inside this method will fail and crash the + // db + log_newpage_buffer(header_buf, false); + + END_CRIT_SECTION(); + + UnlockReleaseBuffer(header_buf); +} + void StoreExternalIndex(Relation index, usearch_metadata_t *external_index_metadata, ForkNumber forkNum, diff --git a/src/hnsw/external_index.h b/src/hnsw/external_index.h index 519383d82..3c78d49c3 100644 --- a/src/hnsw/external_index.h +++ b/src/hnsw/external_index.h @@ -122,6 +122,7 @@ typedef struct } HnswInsertState; uint32 UsearchNodeBytes(usearch_metadata_t *metadata, int vector_bytes, int level); +void StoreExternalEmptyIndex(Relation index, ForkNumber forkNum, char *data, usearch_init_options_t *opts); void StoreExternalIndex(Relation index, usearch_metadata_t *external_index_metadata, ForkNumber forkNum, diff --git a/src/hnsw/extra_dirtied.c b/src/hnsw/extra_dirtied.c index b371303f5..7d8ca9d05 100644 --- a/src/hnsw/extra_dirtied.c +++ b/src/hnsw/extra_dirtied.c @@ -84,6 +84,25 @@ void extra_dirtied_release_all(ExtraDirtiedBufs *ed) ed->extra_dirtied_size = 0; } +// Like extra_dirtied_release_all but does not perform a InvalidXLogRecPtr check. +// Used for inserts on unlogged tables, which do not write to WAL +void extra_dirtied_release_all_no_xlog_check(ExtraDirtiedBufs *ed) +{ + for(int i = 0; i < ed->extra_dirtied_state_size; ++i) { + GenericXLogFinish(ed->extra_dirtied_state[ i ]); + } + + for(int i = 0; i < ed->extra_dirtied_size; i++) { + assert(BufferIsValid(ed->extra_dirtied_buf[ i ])); + // header is not considered extra. we know we should not have dirtied it + // sanity check callees that manimulate extra_dirtied did not violate this + assert(ed->extra_dirtied_blockno[ i ] != 0); + // MarkBufferDirty() had been called by by GenericXLogFinish() already + UnlockReleaseBuffer(ed->extra_dirtied_buf[ i ]); + } + ed->extra_dirtied_size = 0; +} + void extra_dirtied_free(ExtraDirtiedBufs *ed) { if(ed->extra_dirtied_size != 0) { diff --git a/src/hnsw/extra_dirtied.h b/src/hnsw/extra_dirtied.h index 210001144..491207cae 100644 --- a/src/hnsw/extra_dirtied.h +++ b/src/hnsw/extra_dirtied.h @@ -33,6 +33,7 @@ void extra_dirtied_add_wal_read_buffer( ExtraDirtiedBufs* ed, Relation index, ForkNumber forkNum, BlockNumber blockno, Buffer* buf, Page* page); Page extra_dirtied_get(ExtraDirtiedBufs* ed, BlockNumber blockno, Buffer* out_buf); void extra_dirtied_release_all(ExtraDirtiedBufs* ed); +void extra_dirtied_release_all_no_xlog_check(ExtraDirtiedBufs* ed); void extra_dirtied_free(ExtraDirtiedBufs* ed); #endif // LDB_HNSW_EXTRA_DIRTIED_H diff --git a/src/hnsw/insert.c b/src/hnsw/insert.c index 2070bd3f1..6e5e090cd 100644 --- a/src/hnsw/insert.c +++ b/src/hnsw/insert.c @@ -72,6 +72,7 @@ bool ldb_aminsert(Relation index, HnswIndexTuple *new_tuple; usearch_init_options_t opts = {0}; LDB_UNUSED(heap); + LDB_UNUSED(indexInfo); #if PG_VERSION_NUM >= 140000 LDB_UNUSED(indexUnchanged); #endif @@ -109,7 +110,7 @@ bool ldb_aminsert(Relation index, hdr = (HnswIndexHeaderPage *)PageGetContents(hdr_page); assert(hdr->magicNumber == LDB_WAL_MAGIC_NUMBER); - opts.dimensions = GetHnswIndexDimensions(index, indexInfo); + opts.dimensions = hdr->vector_dim; CheckHnswIndexDimensions(index, values[ 0 ], opts.dimensions); PopulateUsearchOpts(index, &opts); opts.retriever_ctx = ldb_wal_retriever_area_init(index, hdr); @@ -182,16 +183,23 @@ bool ldb_aminsert(Relation index, ldb_wal_retriever_area_reset(insertstate->retriever_ctx, hdr); + int needs_wal = RelationNeedsWAL(index); // we only release the header buffer AFTER inserting is finished to make sure nobody else changes the block // structure. todo:: critical section here can definitely be shortened { // GenericXLogFinish also calls MarkBufferDirty(buf) XLogRecPtr ptr = GenericXLogFinish(state); - assert(ptr != InvalidXLogRecPtr); + if(needs_wal) { + assert(ptr != InvalidXLogRecPtr); + } LDB_UNUSED(ptr); } - extra_dirtied_release_all(insertstate->retriever_ctx->extra_dirted); + if(needs_wal) { + extra_dirtied_release_all(insertstate->retriever_ctx->extra_dirted); + } else { + extra_dirtied_release_all_no_xlog_check(insertstate->retriever_ctx->extra_dirted); + } usearch_free(insertstate->uidx, &error); if(error != NULL) { diff --git a/test/c/replica_test_unlogged.c b/test/c/replica_test_unlogged.c new file mode 100644 index 000000000..c1deb8762 --- /dev/null +++ b/test/c/replica_test_unlogged.c @@ -0,0 +1,125 @@ +#include +#include +#include + +#include "runner.h" + +int replica_test_unlogged(TestCaseState* state) +{ + /* + Test Outline + ============= + 1. Create unlogged table and index on it (and insert data) + 2. Make table logged + 3. Insert data on master + 4. Crash and restart slave and call validate_index on it + */ + + PGresult* res; + + // Create unlogged table, index, and insert data + res = PQexec(state->conn, + "DROP TABLE IF EXISTS small_world;" + "CREATE UNLOGGED TABLE small_world (id SERIAL PRIMARY KEY, v real[]);" + "CREATE INDEX ON small_world USING hnsw (v) WITH (dim=3);" + "INSERT INTO small_world (v) VALUES (ARRAY[0,0,1]), (ARRAY[0,1,0]), (ARRAY[1,0,0]);" + "CHECKPOINT;"); + + if(PQresultStatus(res) != PGRES_COMMAND_OK) { + fprintf(stderr, "Failed to prepare unlogged table, create index, and insert data on it: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Validate index on master + res = PQexec(state->conn, "SELECT _lantern_internal.validate_index('small_world_v_idx', false);"); + + if(PQresultStatus(res) != PGRES_TUPLES_OK) { + fprintf(stderr, "Failed to validate index on master: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Alter table to be logged + res = PQexec(state->conn, + "ALTER TABLE small_world SET LOGGED;"); + + if(PQresultStatus(res) != PGRES_COMMAND_OK) { + fprintf(stderr, "Failed to alter unlogged table to logged: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Insert some more data + res = PQexec(state->conn, + "INSERT INTO small_world (v) VALUES (ARRAY[1,2,3])"); + + if(PQresultStatus(res) != PGRES_COMMAND_OK) { + fprintf(stderr, "Failed to insert more data into the now logged table: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Validate index on master after changing table to be logged and inserting data + res = PQexec(state->conn, "SELECT _lantern_internal.validate_index('small_world_v_idx', false);"); + + if(PQresultStatus(res) != PGRES_TUPLES_OK) { + fprintf(stderr, "Failed to validate index on master: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + sleep(2); // wait for replica to sync + + // Validate index on replica + res = PQexec(state->replica_conn, "SELECT _lantern_internal.validate_index('small_world_v_idx', false);"); + + if(PQresultStatus(res) != PGRES_TUPLES_OK) { + fprintf(stderr, "Failed to validate index on replica: %s\n", PQerrorMessage(state->replica_conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Test query on replica + res = PQexec(state->replica_conn, "SELECT v <-> '{1,1,1}' FROM small_world ORDER BY v <-> '{1,1,1}' LIMIT 10;"); + + if(PQresultStatus(res) != PGRES_TUPLES_OK) { + fprintf(stderr, "Failed to query index on replica: %s\n", PQerrorMessage(state->conn)); + PQclear(res); + return 1; + } + + PQclear(res); + + // Crash replica: + system("bash -c '. ../ci/scripts/bitnami-utils.sh && crash_and_restart_postgres_replica'"); + state->replica_conn = connect_database( + state->DB_HOST, state->REPLICA_PORT, state->DB_USER, state->DB_PASSWORD, state->TEST_DB_NAME); + + // Validate index on replica after crash + res = PQexec(state->replica_conn, "SELECT _lantern_internal.validate_index('small_world_v_idx', true);"); + + if(PQresultStatus(res) != PGRES_TUPLES_OK) { + fprintf(stderr, "Failed to validate index on replica after restart: %s\n", PQerrorMessage(state->replica_conn)); + // Tail the log file to see crash error if any + system("tail /tmp/postgres-slave-conf/pg.log 2>/dev/null || true"); + PQclear(res); + return 1; + } + + PQclear(res); + + return 0; +} diff --git a/test/c/runner.c b/test/c/runner.c index 34095e75a..db3f3ad49 100644 --- a/test/c/runner.c +++ b/test/c/runner.c @@ -9,6 +9,7 @@ // Include your test files here #include "replica_test_index.c" +#include "replica_test_unlogged.c" #include "test_op_rewrite.c" // =========================== @@ -98,7 +99,8 @@ int main() struct TestCase test_cases[] = { // Add new test files here to be run {.name = "test_op_rewrite", .func = (TestCaseFunction)test_op_rewrite}, - {.name = "replica_test_index", .func = (TestCaseFunction)replica_test_index} + {.name = "replica_test_index", .func = (TestCaseFunction)replica_test_index}, + {.name = "replica_test_unlogged", .func = (TestCaseFunction)replica_test_unlogged} // ================================ }; @@ -113,12 +115,6 @@ int main() const char *ROOT_DB_NAME = "postgres"; PGconn *root_conn = NULL; - root_conn = connect_database(DB_HOST, DB_PORT, DB_USER, DB_PASSWORD, ROOT_DB_NAME); - - if(root_conn == NULL) { - return 1; - } - for(i = 0; i < sizeof(test_cases) / sizeof(struct TestCase); i++) { current_case = test_cases[ i ]; current_case_state.REPLICA_PORT = REPLICA_PORT; @@ -128,8 +124,15 @@ int main() current_case_state.DB_USER = DB_USER; current_case_state.TEST_DB_NAME = TEST_DB_NAME; + root_conn = connect_database(DB_HOST, DB_PORT, DB_USER, DB_PASSWORD, ROOT_DB_NAME); + printf("[+] Running test case '%s'...\n", current_case.name); + if(root_conn == NULL) { + fprintf(stderr, "[X] Can not connect to root database on port '%s'\n", DB_PORT); + return 1; + } + // Create test database if(recreate_database(root_conn, TEST_DB_NAME)) { fprintf(stderr, "[X] Failed to recreate test database\n"); @@ -144,7 +147,7 @@ int main() continue; } // Wait for replica to sync with master or test db will not exist - sleep(3); + sleep(7); current_case_state.replica_conn = connect_database(DB_HOST, REPLICA_PORT, DB_USER, DB_PASSWORD, TEST_DB_NAME); if(current_case_state.replica_conn == NULL) { @@ -183,13 +186,13 @@ int main() // Close test connection PQfinish(current_case_state.conn); + PQfinish(root_conn); if(ENABLE_REPLICA) { PQfinish(current_case_state.replica_conn); } printf("[+] Test case '%s' passed\n", current_case.name); } - PQfinish(root_conn); printf("[+] All tests passed\n"); return 0; } diff --git a/test/expected/hnsw_create_unlogged.out b/test/expected/hnsw_create_unlogged.out new file mode 100644 index 000000000..c2f95e6b4 --- /dev/null +++ b/test/expected/hnsw_create_unlogged.out @@ -0,0 +1,153 @@ +------------------------------------------------------------------------------ +-- Test HNSW index creation +------------------------------------------------------------------------------ +-- Validate that index creation works with a small number of vectors +\ir utils/small_world_array_unlogged.sql +CREATE UNLOGGED TABLE small_world ( + id VARCHAR(3), + b BOOLEAN, + v REAL[3] +); +INSERT INTO small_world (id, b, v) VALUES + ('000', TRUE, '{0,0,0}'), + ('001', TRUE, '{0,0,1}'), + ('010', FALSE, '{0,1,0}'), + ('011', TRUE, '{0,1,1}'), + ('100', FALSE, '{1,0,0}'), + ('101', FALSE, '{1,0,1}'), + ('110', FALSE, '{1,1,0}'), + ('111', TRUE, '{1,1,1}'); +\ir utils/sift1k_array_unlogged.sql +CREATE UNLOGGED TABLE IF NOT EXISTS sift_base1k ( + id SERIAL, + v REAL[] +); +COPY sift_base1k (v) FROM '/tmp/lantern/vector_datasets/sift_base1k_arrays.csv' WITH csv; +-- Validate that creating a secondary index works +CREATE INDEX ON sift_base1k USING hnsw (v) WITH (dim=128, M=4); +INFO: done init usearch index +INFO: inserted 1000 elements +INFO: done saving 1000 vectors +SELECT * FROM ldb_get_indexes('sift_base1k'); + indexname | size | indexdef | total_index_size +-------------------+--------+---------------------------------------------------------------------------------------------+------------------ + sift_base1k_v_idx | 632 kB | CREATE INDEX sift_base1k_v_idx ON public.sift_base1k USING hnsw (v) WITH (dim='128', m='4') | 632 kB +(1 row) + +SELECT _lantern_internal.validate_index('sift_base1k_v_idx', false); +INFO: validate_index() start for sift_base1k_v_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Validate that index creation works with a larger number of vectors +\ir utils/sift10k_array_unlogged.sql +CREATE UNLOGGED TABLE IF NOT EXISTS sift_base10k ( + id SERIAL PRIMARY KEY, + v REAL[128] +); +\copy sift_base10k (v) FROM '/tmp/lantern/vector_datasets/siftsmall_base_arrays.csv' with csv; +SET lantern.pgvector_compat=FALSE; +CREATE INDEX hnsw_idx ON sift_base10k USING hnsw (v dist_l2sq_ops) WITH (M=2, ef_construction=10, ef=4, dim=128); +INFO: done init usearch index +INFO: inserted 10000 elements +INFO: done saving 10000 vectors +SELECT v AS v4444 FROM sift_base10k WHERE id = 4444 \gset +EXPLAIN (COSTS FALSE) SELECT * FROM sift_base10k order by v :'v4444' LIMIT 10; + QUERY PLAN +----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- + Limit + -> Index Scan using hnsw_idx on sift_base10k + Order By: (v '{55,61,11,4,5,2,13,24,65,49,13,9,23,37,94,38,54,11,14,14,40,31,50,44,53,4,0,0,27,17,8,34,12,10,4,4,22,52,68,53,9,2,0,0,2,116,119,64,119,2,0,0,2,30,119,119,116,5,0,8,47,9,5,60,7,7,10,23,56,50,23,5,28,68,6,18,24,65,50,9,119,75,3,0,1,8,12,85,119,11,4,6,8,9,5,74,25,11,8,20,18,12,2,21,11,90,25,32,33,15,2,9,84,67,8,4,22,31,11,33,119,30,3,6,0,0,0,26}'::real[]) +(3 rows) + +SELECT _lantern_internal.validate_index('hnsw_idx', false); +INFO: validate_index() start for hnsw_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +--- Validate that M values inside the allowed range [2, 128] do not throw an error +CREATE INDEX ON small_world USING hnsw (v) WITH (M=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +CREATE INDEX ON small_world USING hnsw (v) WITH (M=128); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +---- Validate that M values outside the allowed range [2, 128] throw an error +\set ON_ERROR_STOP off +CREATE INDEX ON small_world USING hnsw (v) WITH (M=1); +ERROR: value 1 out of bounds for option "m" +CREATE INDEX ON small_world USING hnsw (v) WITH (M=129); +ERROR: value 129 out of bounds for option "m" +\set ON_ERROR_STOP on +-- Validate index dimension inference +CREATE UNLOGGED TABLE small_world4 ( + id varchar(3), + vector real[] +); +-- If the first row is NULL we do not infer a dimension +\set ON_ERROR_STOP off +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +ERROR: column does not have dimensions, please specify one +begin; +INSERT INTO small_world4 (id, vector) VALUES +('000', NULL), +('001', '{1,0,0,1}'); +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +ERROR: column does not have dimensions, please specify one +rollback; +\set ON_ERROR_STOP on +INSERT INTO small_world4 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); +CREATE INDEX small_world4_hnsw_idx ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +SELECT * FROM ldb_get_indexes('small_world4'); + indexname | size | indexdef | total_index_size +-----------------------+-------+---------------------------------------------------------------------------------------------------------------------------+------------------ + small_world4_hnsw_idx | 24 kB | CREATE INDEX small_world4_hnsw_idx ON public.small_world4 USING hnsw (vector) WITH (m='14', ef='22', ef_construction='2') | 24 kB +(1 row) + +-- the index will not allow changing the dimension of a vector element +\set ON_ERROR_STOP off +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '000'; +ERROR: Wrong number of dimensions: 3 instead of 4 expected +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '001'; +ERROR: Wrong number of dimensions: 3 instead of 4 expected +\set ON_ERROR_STOP on +INSERT INTO small_world4 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'); +SELECT _lantern_internal.validate_index('small_world4_hnsw_idx', false); +INFO: validate_index() start for small_world4_hnsw_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- without the index, I can change the dimension of a vector element +DROP INDEX small_world4_hnsw_idx; +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '001'; +-- but then, I cannot create the same dimension-inferred index +\set ON_ERROR_STOP off +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +ERROR: Wrong number of dimensions: 3 instead of 4 expected +\set ON_ERROR_STOP on diff --git a/test/expected/hnsw_insert_unlogged.out b/test/expected/hnsw_insert_unlogged.out new file mode 100644 index 000000000..1c692dd9f --- /dev/null +++ b/test/expected/hnsw_insert_unlogged.out @@ -0,0 +1,153 @@ +--------------------------------------------------------------------- +-- Test HNSW index inserts on empty table +--------------------------------------------------------------------- +-- set an artificially low work_mem to make sure work_mem exceeded warnings are printed +set work_mem = '64kB'; +-- We do not actually print the warnings generated for exceeding work_mem because the work_mem +-- check does not work for postgres 13 and lower.So, if we printed the warnings, we would get a regression +-- failure in older postgres versions. We still reduce workmem to exercise relevant codepaths for coverage +set client_min_messages = 'ERROR'; +CREATE UNLOGGED TABLE small_world ( + id SERIAL PRIMARY KEY, + v REAL[2] -- this demonstates that postgres actually does not enforce real[] length as we actually insert vectors of length 3 +); +CREATE UNLOGGED TABLE small_world_int ( + id SERIAL PRIMARY KEY, + v INTEGER[] +); +CREATE INDEX ON small_world USING hnsw (v) WITH (dim=3); +INFO: done init usearch index +INFO: inserted 0 elements +INFO: done saving 0 vectors +SELECT _lantern_internal.validate_index('small_world_v_idx', false); +INFO: validate_index() start for small_world_v_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Insert rows with valid vector data +INSERT INTO small_world (v) VALUES ('{0,0,1}'), ('{0,1,0}'); +INSERT INTO small_world (v) VALUES (NULL); +-- Attempt to insert a row with an incorrect vector length +\set ON_ERROR_STOP off +-- Cannot create an hnsw index with implicit typecasts (trying to cast integer[] to real[], in this case) +CREATE INDEX ON small_world_int USING hnsw (v dist_l2sq_ops) WITH (dim=3); +ERROR: operator class "dist_l2sq_ops" does not accept data type integer[] +INSERT INTO small_world (v) VALUES ('{1,1,1,1}'); +ERROR: Wrong number of dimensions: 4 instead of 3 expected +\set ON_ERROR_STOP on +DROP TABLE small_world; +-- set work_mem to a value that is enough for the tests +set client_min_messages = 'WARNING'; +set work_mem = '10MB'; +--------------------------------------------------------------------- +-- Test HNSW index inserts on non-empty table +--------------------------------------------------------------------- +\ir utils/small_world_array_unlogged.sql +CREATE UNLOGGED TABLE small_world ( + id VARCHAR(3), + b BOOLEAN, + v REAL[3] +); +INSERT INTO small_world (id, b, v) VALUES + ('000', TRUE, '{0,0,0}'), + ('001', TRUE, '{0,0,1}'), + ('010', FALSE, '{0,1,0}'), + ('011', TRUE, '{0,1,1}'), + ('100', FALSE, '{1,0,0}'), + ('101', FALSE, '{1,0,1}'), + ('110', FALSE, '{1,1,0}'), + ('111', TRUE, '{1,1,1}'); +CREATE INDEX ON small_world USING hnsw (v) WITH (dim=3); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +SET enable_seqscan = false; +SET lantern.pgvector_compat = false; +-- Inserting vectors of the same dimension and nulls should work +INSERT INTO small_world (v) VALUES ('{1,1,2}'); +INSERT INTO small_world (v) VALUES (NULL); +-- Inserting vectors of different dimension should fail +\set ON_ERROR_STOP off +INSERT INTO small_world (v) VALUES ('{4,4,4,4}'); +ERROR: Wrong number of dimensions: 4 instead of 3 expected +\set ON_ERROR_STOP on +-- Verify that the index works with the inserted vectors +SELECT + ROUND(l2sq_dist(v, '{0,0,0}')::numeric, 2) +FROM + small_world +ORDER BY + v '{0,0,0}'; + round +------- + 0.00 + 1.00 + 1.00 + 1.00 + 2.00 + 2.00 + 2.00 + 3.00 + 6.00 +(9 rows) + +-- Ensure the index size remains consistent after inserts +SELECT * from ldb_get_indexes('small_world'); + indexname | size | indexdef | total_index_size +-------------------+-------+------------------------------------------------------------------------------------+------------------ + small_world_v_idx | 24 kB | CREATE INDEX small_world_v_idx ON public.small_world USING hnsw (v) WITH (dim='3') | 24 kB +(1 row) + +-- Ensure the query plan remains consistent after inserts +EXPLAIN (COSTS FALSE) +SELECT + ROUND(l2sq_dist(v, '{0,0,0}')::numeric, 2) +FROM + small_world +ORDER BY + v '{0,0,0}' +LIMIT 10; + QUERY PLAN +--------------------------------------------------------- + Limit + -> Index Scan using small_world_v_idx on small_world + Order By: (v '{0,0,0}'::real[]) +(3 rows) + +SELECT _lantern_internal.validate_index('small_world_v_idx', false); +INFO: validate_index() start for small_world_v_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Test the index with a larger number of vectors +CREATE UNLOGGED TABLE sift_base10k ( + id SERIAL PRIMARY KEY, + v REAL[128] +); +CREATE INDEX hnsw_idx ON sift_base10k USING hnsw (v dist_l2sq_ops) WITH (M=2, ef_construction=10, ef=4, dim=128); +INFO: done init usearch index +INFO: inserted 0 elements +INFO: done saving 0 vectors +\COPY sift_base10k (v) FROM '/tmp/lantern/vector_datasets/siftsmall_base_arrays.csv' WITH CSV; +SELECT v AS v4444 FROM sift_base10k WHERE id = 4444 \gset +EXPLAIN (COSTS FALSE) SELECT * FROM sift_base10k order by v :'v4444'; + QUERY PLAN +----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- + Index Scan using hnsw_idx on sift_base10k + Order By: (v '{55,61,11,4,5,2,13,24,65,49,13,9,23,37,94,38,54,11,14,14,40,31,50,44,53,4,0,0,27,17,8,34,12,10,4,4,22,52,68,53,9,2,0,0,2,116,119,64,119,2,0,0,2,30,119,119,116,5,0,8,47,9,5,60,7,7,10,23,56,50,23,5,28,68,6,18,24,65,50,9,119,75,3,0,1,8,12,85,119,11,4,6,8,9,5,74,25,11,8,20,18,12,2,21,11,90,25,32,33,15,2,9,84,67,8,4,22,31,11,33,119,30,3,6,0,0,0,26}'::real[]) +(2 rows) + +SELECT _lantern_internal.validate_index('hnsw_idx', false); +INFO: validate_index() start for hnsw_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + diff --git a/test/expected/hnsw_logged_unlogged.out b/test/expected/hnsw_logged_unlogged.out new file mode 100644 index 000000000..4a88ca868 --- /dev/null +++ b/test/expected/hnsw_logged_unlogged.out @@ -0,0 +1,294 @@ +-- Test changing tables from logged to unlogged, and from unlogged to logged +-- -------------------------- +-- Start with logged table +-- -------------------------- +CREATE TABLE small_world ( + id varchar(3), + vector real[] +); +-- Insert (we insert data such that each vector has a unique distance from (0,0,0) +INSERT INTO small_world (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,1,1,0}'), +('011', '{1,1,1,1}'), +('100', '{2,1,0,0}'), +('101', '{1,2,0,1}'), +('110', '{1,2,1,1}'), +('111', '{2,2,2,0}'); +-- Create an index +CREATE INDEX small_world_idx ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Validate index +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Query +SET enable_seqscan = false; +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 111 | 12 | {2,2,2,0} +(8 rows) + +-- Switch table to be unlogged +ALTER TABLE small_world SET UNLOGGED; +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Create a new index +CREATE INDEX small_world_idx2 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx2', false); +INFO: validate_index() start for small_world_idx2 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('002', '{0,3,1,1}'); +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 002 | 11 | {0,3,1,1} + 111 | 12 | {2,2,2,0} +(9 rows) + +-- Switch table to be logged again +ALTER TABLE small_world SET LOGGED; +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +-- Create a new index +CREATE INDEX small_world_idx3 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx2', false); +INFO: validate_index() start for small_world_idx2 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx3', false); +INFO: validate_index() start for small_world_idx3 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('020', '{0,0,4,0}'); +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 002 | 11 | {0,3,1,1} + 111 | 12 | {2,2,2,0} + 020 | 16 | {0,0,4,0} +(10 rows) + +-- -------------------------- +-- Start with unlogged table +-- -------------------------- +DROP TABLE small_world; +CREATE UNLOGGED TABLE small_world ( + id varchar(3), + vector real[] +); +-- Insert (we insert data such that each vector has a unique distance from (0,0,0) +INSERT INTO small_world (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,1,1,0}'), +('011', '{1,1,1,1}'), +('100', '{2,1,0,0}'), +('101', '{1,2,0,1}'), +('110', '{1,2,1,1}'), +('111', '{2,2,2,0}'); +-- Create an index +CREATE INDEX small_world_idx ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Validate index +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Query +SET enable_seqscan = false; +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 111 | 12 | {2,2,2,0} +(8 rows) + +-- Switch table to be logged +ALTER TABLE small_world SET LOGGED; +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Create a new index +CREATE INDEX small_world_idx2 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 8 elements +INFO: done saving 8 vectors +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx2', false); +INFO: validate_index() start for small_world_idx2 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('002', '{0,3,1,1}'); +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 002 | 11 | {0,3,1,1} + 111 | 12 | {2,2,2,0} +(9 rows) + +-- Switch table to be unlogged again +ALTER TABLE small_world SET UNLOGGED; +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +-- Create a new index +CREATE INDEX small_world_idx3 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +INFO: done init usearch index +INFO: inserted 9 elements +INFO: done saving 9 vectors +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +INFO: validate_index() start for small_world_idx +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx2', false); +INFO: validate_index() start for small_world_idx2 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +SELECT _lantern_internal.validate_index('small_world_idx3', false); +INFO: validate_index() start for small_world_idx3 +INFO: validate_index() done, no issues found. + validate_index +---------------- + +(1 row) + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('020', '{0,0,4,0}'); +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + id | l2sq_dist | vector +-----+-----------+----------- + 000 | 1 | {1,0,0,0} + 001 | 2 | {1,0,0,1} + 010 | 3 | {1,1,1,0} + 011 | 4 | {1,1,1,1} + 100 | 5 | {2,1,0,0} + 101 | 6 | {1,2,0,1} + 110 | 7 | {1,2,1,1} + 002 | 11 | {0,3,1,1} + 111 | 12 | {2,2,2,0} + 020 | 16 | {0,0,4,0} +(10 rows) + diff --git a/test/schedule.txt b/test/schedule.txt index f8210d6cd..4aac98cd6 100644 --- a/test/schedule.txt +++ b/test/schedule.txt @@ -3,6 +3,6 @@ # - every test that needs to be run iff pgvector is installed appears in a 'test_pgvector:' line # - 'test' lines may have multiple space-separated tests. All tests in a single 'test' line will be run in parallel -test: hnsw_config hnsw_correct hnsw_create hnsw_create_expr hnsw_dist_func hnsw_insert hnsw_select hnsw_todo hnsw_index_from_file hnsw_cost_estimate ext_relocation hnsw_ef_search hnsw_failure_point hnsw_operators hnsw_blockmap_create +test: hnsw_config hnsw_correct hnsw_create hnsw_create_expr hnsw_dist_func hnsw_insert hnsw_select hnsw_todo hnsw_index_from_file hnsw_cost_estimate ext_relocation hnsw_ef_search hnsw_failure_point hnsw_operators hnsw_blockmap_create hnsw_create_unlogged hnsw_insert_unlogged hnsw_logged_unlogged test_pgvector: hnsw_vector test_extras: hnsw_extras diff --git a/test/sql/hnsw_create_unlogged.sql b/test/sql/hnsw_create_unlogged.sql new file mode 100644 index 000000000..768754b68 --- /dev/null +++ b/test/sql/hnsw_create_unlogged.sql @@ -0,0 +1,80 @@ +------------------------------------------------------------------------------ +-- Test HNSW index creation +------------------------------------------------------------------------------ + +-- Validate that index creation works with a small number of vectors +\ir utils/small_world_array_unlogged.sql +\ir utils/sift1k_array_unlogged.sql + +-- Validate that creating a secondary index works +CREATE INDEX ON sift_base1k USING hnsw (v) WITH (dim=128, M=4); +SELECT * FROM ldb_get_indexes('sift_base1k'); +SELECT _lantern_internal.validate_index('sift_base1k_v_idx', false); + +-- Validate that index creation works with a larger number of vectors +\ir utils/sift10k_array_unlogged.sql +SET lantern.pgvector_compat=FALSE; + +CREATE INDEX hnsw_idx ON sift_base10k USING hnsw (v dist_l2sq_ops) WITH (M=2, ef_construction=10, ef=4, dim=128); +SELECT v AS v4444 FROM sift_base10k WHERE id = 4444 \gset +EXPLAIN (COSTS FALSE) SELECT * FROM sift_base10k order by v :'v4444' LIMIT 10; +SELECT _lantern_internal.validate_index('hnsw_idx', false); + +--- Validate that M values inside the allowed range [2, 128] do not throw an error + +CREATE INDEX ON small_world USING hnsw (v) WITH (M=2); +CREATE INDEX ON small_world USING hnsw (v) WITH (M=128); + +---- Validate that M values outside the allowed range [2, 128] throw an error +\set ON_ERROR_STOP off +CREATE INDEX ON small_world USING hnsw (v) WITH (M=1); +CREATE INDEX ON small_world USING hnsw (v) WITH (M=129); +\set ON_ERROR_STOP on + +-- Validate index dimension inference +CREATE UNLOGGED TABLE small_world4 ( + id varchar(3), + vector real[] +); +-- If the first row is NULL we do not infer a dimension +\set ON_ERROR_STOP off +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +begin; +INSERT INTO small_world4 (id, vector) VALUES +('000', NULL), +('001', '{1,0,0,1}'); +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +rollback; +\set ON_ERROR_STOP on + +INSERT INTO small_world4 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); +CREATE INDEX small_world4_hnsw_idx ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +SELECT * FROM ldb_get_indexes('small_world4'); +-- the index will not allow changing the dimension of a vector element +\set ON_ERROR_STOP off +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '000'; +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '001'; +\set ON_ERROR_STOP on + +INSERT INTO small_world4 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'); + +SELECT _lantern_internal.validate_index('small_world4_hnsw_idx', false); + +-- without the index, I can change the dimension of a vector element +DROP INDEX small_world4_hnsw_idx; +UPDATE small_world4 SET vector = '{0,0,0}' WHERE id = '001'; +-- but then, I cannot create the same dimension-inferred index +\set ON_ERROR_STOP off +CREATE INDEX ON small_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +\set ON_ERROR_STOP on diff --git a/test/sql/hnsw_insert_unlogged.sql b/test/sql/hnsw_insert_unlogged.sql new file mode 100644 index 000000000..bf8066cea --- /dev/null +++ b/test/sql/hnsw_insert_unlogged.sql @@ -0,0 +1,94 @@ +--------------------------------------------------------------------- +-- Test HNSW index inserts on empty table +--------------------------------------------------------------------- +-- set an artificially low work_mem to make sure work_mem exceeded warnings are printed +set work_mem = '64kB'; +-- We do not actually print the warnings generated for exceeding work_mem because the work_mem +-- check does not work for postgres 13 and lower.So, if we printed the warnings, we would get a regression +-- failure in older postgres versions. We still reduce workmem to exercise relevant codepaths for coverage +set client_min_messages = 'ERROR'; + +CREATE UNLOGGED TABLE small_world ( + id SERIAL PRIMARY KEY, + v REAL[2] -- this demonstates that postgres actually does not enforce real[] length as we actually insert vectors of length 3 +); + +CREATE UNLOGGED TABLE small_world_int ( + id SERIAL PRIMARY KEY, + v INTEGER[] +); + +CREATE INDEX ON small_world USING hnsw (v) WITH (dim=3); +SELECT _lantern_internal.validate_index('small_world_v_idx', false); + +-- Insert rows with valid vector data +INSERT INTO small_world (v) VALUES ('{0,0,1}'), ('{0,1,0}'); +INSERT INTO small_world (v) VALUES (NULL); + +-- Attempt to insert a row with an incorrect vector length +\set ON_ERROR_STOP off +-- Cannot create an hnsw index with implicit typecasts (trying to cast integer[] to real[], in this case) +CREATE INDEX ON small_world_int USING hnsw (v dist_l2sq_ops) WITH (dim=3); +INSERT INTO small_world (v) VALUES ('{1,1,1,1}'); +\set ON_ERROR_STOP on + +DROP TABLE small_world; + +-- set work_mem to a value that is enough for the tests +set client_min_messages = 'WARNING'; +set work_mem = '10MB'; + +--------------------------------------------------------------------- +-- Test HNSW index inserts on non-empty table +--------------------------------------------------------------------- + +\ir utils/small_world_array_unlogged.sql + +CREATE INDEX ON small_world USING hnsw (v) WITH (dim=3); + +SET enable_seqscan = false; +SET lantern.pgvector_compat = false; + +-- Inserting vectors of the same dimension and nulls should work +INSERT INTO small_world (v) VALUES ('{1,1,2}'); +INSERT INTO small_world (v) VALUES (NULL); + +-- Inserting vectors of different dimension should fail +\set ON_ERROR_STOP off +INSERT INTO small_world (v) VALUES ('{4,4,4,4}'); +\set ON_ERROR_STOP on + +-- Verify that the index works with the inserted vectors +SELECT + ROUND(l2sq_dist(v, '{0,0,0}')::numeric, 2) +FROM + small_world +ORDER BY + v '{0,0,0}'; + +-- Ensure the index size remains consistent after inserts +SELECT * from ldb_get_indexes('small_world'); + +-- Ensure the query plan remains consistent after inserts +EXPLAIN (COSTS FALSE) +SELECT + ROUND(l2sq_dist(v, '{0,0,0}')::numeric, 2) +FROM + small_world +ORDER BY + v '{0,0,0}' +LIMIT 10; + +SELECT _lantern_internal.validate_index('small_world_v_idx', false); + +-- Test the index with a larger number of vectors +CREATE UNLOGGED TABLE sift_base10k ( + id SERIAL PRIMARY KEY, + v REAL[128] +); +CREATE INDEX hnsw_idx ON sift_base10k USING hnsw (v dist_l2sq_ops) WITH (M=2, ef_construction=10, ef=4, dim=128); +\COPY sift_base10k (v) FROM '/tmp/lantern/vector_datasets/siftsmall_base_arrays.csv' WITH CSV; +SELECT v AS v4444 FROM sift_base10k WHERE id = 4444 \gset +EXPLAIN (COSTS FALSE) SELECT * FROM sift_base10k order by v :'v4444'; + +SELECT _lantern_internal.validate_index('hnsw_idx', false); diff --git a/test/sql/hnsw_logged_unlogged.sql b/test/sql/hnsw_logged_unlogged.sql new file mode 100644 index 000000000..fe4d7700a --- /dev/null +++ b/test/sql/hnsw_logged_unlogged.sql @@ -0,0 +1,138 @@ +-- Test changing tables from logged to unlogged, and from unlogged to logged + +-- -------------------------- +-- Start with logged table +-- -------------------------- +CREATE TABLE small_world ( + id varchar(3), + vector real[] +); + +-- Insert (we insert data such that each vector has a unique distance from (0,0,0) +INSERT INTO small_world (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,1,1,0}'), +('011', '{1,1,1,1}'), +('100', '{2,1,0,0}'), +('101', '{1,2,0,1}'), +('110', '{1,2,1,1}'), +('111', '{2,2,2,0}'); + + +-- Create an index +CREATE INDEX small_world_idx ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate index +SELECT _lantern_internal.validate_index('small_world_idx', false); + +-- Query +SET enable_seqscan = false; +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + +-- Switch table to be unlogged +ALTER TABLE small_world SET UNLOGGED; + +-- Create a new index +CREATE INDEX small_world_idx2 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +SELECT _lantern_internal.validate_index('small_world_idx2', false); + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('002', '{0,3,1,1}'); + +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + +-- Switch table to be logged again +ALTER TABLE small_world SET LOGGED; + +-- Create a new index +CREATE INDEX small_world_idx3 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +SELECT _lantern_internal.validate_index('small_world_idx2', false); +SELECT _lantern_internal.validate_index('small_world_idx3', false); + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('020', '{0,0,4,0}'); + +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + +-- -------------------------- +-- Start with unlogged table +-- -------------------------- +DROP TABLE small_world; + +CREATE UNLOGGED TABLE small_world ( + id varchar(3), + vector real[] +); + +-- Insert (we insert data such that each vector has a unique distance from (0,0,0) +INSERT INTO small_world (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,1,1,0}'), +('011', '{1,1,1,1}'), +('100', '{2,1,0,0}'), +('101', '{1,2,0,1}'), +('110', '{1,2,1,1}'), +('111', '{2,2,2,0}'); + + +-- Create an index +CREATE INDEX small_world_idx ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate index +SELECT _lantern_internal.validate_index('small_world_idx', false); + +-- Query +SET enable_seqscan = false; +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + +-- Switch table to be logged +ALTER TABLE small_world SET LOGGED; + +-- Create a new index +CREATE INDEX small_world_idx2 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +SELECT _lantern_internal.validate_index('small_world_idx2', false); + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('002', '{0,3,1,1}'); + +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + + +-- Switch table to be unlogged again +ALTER TABLE small_world SET UNLOGGED; + +-- Create a new index +CREATE INDEX small_world_idx3 ON small_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + +-- Validate indexes +SELECT _lantern_internal.validate_index('small_world_idx', false); +SELECT _lantern_internal.validate_index('small_world_idx2', false); +SELECT _lantern_internal.validate_index('small_world_idx3', false); + +-- Insert +INSERT INTO small_world (id, vector) VALUES ('020', '{0,0,4,0}'); + +-- Query +SELECT id, l2sq_dist(vector, '{0, 0, 0, 0}'), vector FROM small_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + + + diff --git a/test/sql/manual_tests/hnsw_unlogged_post.sql b/test/sql/manual_tests/hnsw_unlogged_post.sql new file mode 100644 index 000000000..686ceb8da --- /dev/null +++ b/test/sql/manual_tests/hnsw_unlogged_post.sql @@ -0,0 +1,58 @@ +-- INSTRUCTIONS +-- this test is only to be run after running the `hnsw_unlogged_pre.sql` test and crashing postgres + +-- Validate recovered unlogged index structure (postgres should have moved the init fork data for these indexes to their main forks) +SELECT _lantern_internal.validate_index('unlogged_world1_hnsw_idx', true); +--SELECT _lantern_internal.validate_index('unlogged_world2_hnsw_idx', true); +SELECT _lantern_internal.validate_index('unlogged_world3_hnsw_idx', true); +SELECT _lantern_internal.validate_index('unlogged_world4_hnsw_idx', true); +SELECT _lantern_internal.validate_index('morph_world_hnsw_idx', true); +SELECT _lantern_internal.validate_index('morph_world2_hnsw_idx', true); + +-- Verify that the tables are now in fact empty after the crash, since tables are unlogged +SELECT * from unlogged_world1; +--SELECT * from unlogged_world2; +SELECT * from unlogged_world3; +SELECT * from unlogged_world4; +SELECT * from morph_world; +SELECT * from morph_world2; + +-- Verify that the indexes are operational +set enable_seqscan = false; +set enable_indexscan = true; + +-- These should use an index scan and return nothing (since table is empty) +EXPLAIN SELECT * FROM unlogged_world1 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM unlogged_world1 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +--EXPLAIN SELECT * FROM unlogged_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +--SELECT * FROM unlogged_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +EXPLAIN SELECT * FROM unlogged_world3 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM unlogged_world3 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +EXPLAIN SELECT * FROM unlogged_world4 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM unlogged_world4 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +EXPLAIN SELECT * FROM morph_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM morph_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +EXPLAIN SELECT * FROM morph_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM morph_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; + +-- Insert data into each one +INSERT INTO unlogged_world1 (id, vector) VALUES ('101', '{1,2,3,4}'); +--INSERT INTO unlogged_world2 (id, vector) VALUES ('101', '{1,2,3,4}'); +INSERT INTO unlogged_world3 (id, vector) VALUES ('101', '{1,2,3,4}'); +INSERT INTO unlogged_world4 (id, vector) VALUES ('101', '{1,2,3,4}'); +INSERT INTO morph_world (id, vector) VALUES ('101', '{1,2,3,4}'); +INSERT INTO morph_world2 (id, vector) VALUES ('101', '{1,2,3,4}'); + + +-- Test queries after new data inserted +SELECT * FROM unlogged_world1 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +--SELECT * FROM unlogged_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM unlogged_world3 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM unlogged_world4 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM morph_world ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; +SELECT * FROM morph_world2 ORDER BY vector <-> ARRAY[0, 0, 0, 0] LIMIT 10; diff --git a/test/sql/manual_tests/hnsw_unlogged_pre.sql b/test/sql/manual_tests/hnsw_unlogged_pre.sql new file mode 100644 index 000000000..cc573bd3d --- /dev/null +++ b/test/sql/manual_tests/hnsw_unlogged_pre.sql @@ -0,0 +1,139 @@ +-- INSTRUCTIONS +-- run this file first, and then crash +-- then, run the `hnsw_unlogged_post.sql` test + +DROP TABLE IF EXISTS unlogged_world1; +DROP TABLE IF EXISTS unlogged_world2; +DROP TABLE IF EXISTS unlogged_world3; +DROP TABLE IF EXISTS unlogged_world4; + +-- Explanation of tables +-- unlogged_world1: empty, dimension specified in index +-- unlogged_world2: empty, dimension not specified in index (this will error for now, ignored at the moment) +-- unlogged_world3: non-empty, dimension specified in index +-- unlogged_world4: non-empty, dimension not specified in index + +-- morph_world: will start as unlogged and then be altered to logged; non-empty, dimension not specified +-- morph_world2: will start as logged and then be altered to unlogged; non-empty, dimension not specified + + +CREATE UNLOGGED TABLE unlogged_world1 ( + id varchar(3), + vector real[] +); + +/* +CREATE UNLOGGED TABLE unlogged_world2 ( + id varchar(3), + vector real[] +); +*/ + +CREATE UNLOGGED TABLE unlogged_world3 ( + id varchar(3), + vector real[] +); + +CREATE UNLOGGED TABLE unlogged_world4 ( + id varchar(3), + vector real[] +); + +CREATE UNLOGGED TABLE morph_world ( + id varchar(3), + vector real[] +); + +CREATE TABLE morph_world2 ( + id varchar(3), + vector real[] +); + +-- Insert data into some tables + +INSERT INTO unlogged_world3 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); + +INSERT INTO unlogged_world4 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); + +INSERT INTO morph_world (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); + +INSERT INTO morph_world2 (id, vector) VALUES +('000', '{1,0,0,0}'), +('001', '{1,0,0,1}'), +('010', '{1,0,1,0}'), +('011', '{1,0,1,1}'), +('100', '{1,1,0,0}'), +('101', '{1,1,0,1}'), +('110', '{1,1,1,0}'), +('111', '{1,1,1,1}'); + + +-- Change table status +ALTER TABLE morph_world SET LOGGED; + +ALTER TABLE morph_world2 SET UNLOGGED; + + +-- Verify contents of unlogged tables pre-crash +SELECT * from unlogged_world1; +--SELECT * from unlogged_world2; +SELECT * from unlogged_world3; +SELECT * from unlogged_world4; +SELECT * from morph_world; +SELECT * from morph_world2; + + +-- Create indexes +CREATE INDEX unlogged_world1_hnsw_idx ON unlogged_world1 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2, dim=4); +--CREATE INDEX unlogged_world2_hnsw_idx ON unlogged_world2 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +CREATE INDEX unlogged_world3_hnsw_idx ON unlogged_world3 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2, dim=4); +CREATE INDEX unlogged_world4_hnsw_idx ON unlogged_world4 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +CREATE INDEX morph_world_hnsw_idx ON morph_world USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); +CREATE INDEX morph_world2_hnsw_idx ON morph_world2 USING hnsw (vector) WITH (M=14, ef=22, ef_construction=2); + + + +-- Validate indexes pre-crash +SELECT _lantern_internal.validate_index('unlogged_world1_hnsw_idx', true); +--SELECT _lantern_internal.validate_index('unlogged_world2_hnsw_idx', true); +SELECT _lantern_internal.validate_index('unlogged_world3_hnsw_idx', true); +SELECT _lantern_internal.validate_index('unlogged_world4_hnsw_idx', true); +SELECT _lantern_internal.validate_index('morph_world_hnsw_idx', true); +SELECT _lantern_internal.validate_index('morph_world2_hnsw_idx', true); + + + +-- Now, we crash the database (todo:: find a way to do this programatically from within this .sql file?) +-- We can do this in one of two ways. Either: +-- 1. Find pid of master pg process using `ps aux | grep postgres` and then kill it with `kill -9` +-- OR +-- 2. `pg_ctl stop -D {PGDATA DIRECTORY} -m immediate` + +-- After crashing, restart it with: +-- sudo systemctl restart postgresql + +-- Then, run `hnsw_unlogged_post.sql` \ No newline at end of file diff --git a/test/sql/utils/sift10k_array_unlogged.sql b/test/sql/utils/sift10k_array_unlogged.sql new file mode 100644 index 000000000..626f08cc5 --- /dev/null +++ b/test/sql/utils/sift10k_array_unlogged.sql @@ -0,0 +1,5 @@ +CREATE UNLOGGED TABLE IF NOT EXISTS sift_base10k ( + id SERIAL PRIMARY KEY, + v REAL[128] +); +\copy sift_base10k (v) FROM '/tmp/lantern/vector_datasets/siftsmall_base_arrays.csv' with csv; \ No newline at end of file diff --git a/test/sql/utils/sift1k_array_unlogged.sql b/test/sql/utils/sift1k_array_unlogged.sql new file mode 100644 index 000000000..b984a75f5 --- /dev/null +++ b/test/sql/utils/sift1k_array_unlogged.sql @@ -0,0 +1,6 @@ +CREATE UNLOGGED TABLE IF NOT EXISTS sift_base1k ( + id SERIAL, + v REAL[] +); + +COPY sift_base1k (v) FROM '/tmp/lantern/vector_datasets/sift_base1k_arrays.csv' WITH csv; diff --git a/test/sql/utils/small_world_array_unlogged.sql b/test/sql/utils/small_world_array_unlogged.sql new file mode 100644 index 000000000..671cd0bd0 --- /dev/null +++ b/test/sql/utils/small_world_array_unlogged.sql @@ -0,0 +1,15 @@ +CREATE UNLOGGED TABLE small_world ( + id VARCHAR(3), + b BOOLEAN, + v REAL[3] +); + +INSERT INTO small_world (id, b, v) VALUES + ('000', TRUE, '{0,0,0}'), + ('001', TRUE, '{0,0,1}'), + ('010', FALSE, '{0,1,0}'), + ('011', TRUE, '{0,1,1}'), + ('100', FALSE, '{1,0,0}'), + ('101', FALSE, '{1,0,1}'), + ('110', FALSE, '{1,1,0}'), + ('111', TRUE, '{1,1,1}');