Skip to content

Commit

Permalink
Update param values and add new procedure (opensearch-project#249)
Browse files Browse the repository at this point in the history
Update parameter values to achieve optimal recall during nightly runs.
Add a new procedure that indexes the data and then force-merges segments.
This is helpful for preparing a snapshot for search-only
nightly runs.

Signed-off-by: Vijayan Balasubramanian <balasvij@amazon.com>
  • Loading branch information
VijayanB authored and harshavamsi committed Jul 16, 2024
1 parent 2e21650 commit 340093e
Show file tree
Hide file tree
Showing 7 changed files with 33 additions and 21 deletions.
9 changes: 5 additions & 4 deletions vectorsearch/params/corpus/10million/faiss-cohere-768-dp.json
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,8 @@
"target_index_name": "target_index",
"target_field_name": "target_field",
"target_index_body": "indices/faiss-index.json",
"target_index_primary_shards": 18,
"target_index_primary_shards": 6,
"target_index_replica_shards": 1,
"target_index_dimension": 768,
"target_index_space_type": "innerproduct",

Expand All @@ -11,9 +12,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-10m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,8 @@
"target_index_name": "target_index",
"target_field_name": "target_field",
"target_index_body": "indices/lucene-index.json",
"target_index_primary_shards": 18,
"target_index_primary_shards": 6,
"target_index_replica_shards": 1,
"target_index_dimension": 768,
"target_index_space_type": "innerproduct",

Expand All @@ -11,9 +12,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-10m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,8 @@
"target_index_name": "target_index",
"target_field_name": "target_field",
"target_index_body": "indices/nmslib-index.json",
"target_index_primary_shards": 18,
"target_index_primary_shards": 6,
"target_index_replica_shards": 1,
"target_index_dimension": 768,
"target_index_space_type": "innerproduct",

Expand All @@ -11,9 +12,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-10m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
6 changes: 3 additions & 3 deletions vectorsearch/params/corpus/1million/faiss-cohere-768-dp.json
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-1m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
6 changes: 3 additions & 3 deletions vectorsearch/params/corpus/1million/lucene-cohere-768-dp.json
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-1m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
6 changes: 3 additions & 3 deletions vectorsearch/params/corpus/1million/nmslib-cohere-768-dp.json
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,9 @@
"target_index_bulk_index_data_set_corpus": "cohere-1m",
"target_index_bulk_indexing_clients": 10,

"target_index_max_num_segments": 10,
"hnsw_ef_search": 100,
"hnsw_ef_construction": 100,
"target_index_max_num_segments": 1,
"hnsw_ef_search": 256,
"hnsw_ef_construction": 256,

"query_k": 100,
"query_body": {
Expand Down
9 changes: 9 additions & 0 deletions vectorsearch/test_procedures/default.json
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,15 @@
{{ benchmark.collect(parts="common/index-only-schedule.json") }}
]
},
{
    "name": "no-train-test-index-with-merge",
    "description": "Index documents and then force merge segments for vector search",
    "default": false,
    "schedule": [
        {{ benchmark.collect(parts="common/index-only-schedule.json") }},
        {{ benchmark.collect(parts="common/force-merge-schedule.json") }}
    ]
},
{
"name": "search-only",
"default": false,
Expand Down

0 comments on commit 340093e

Please sign in to comment.