diff --git a/cpp_src/CMakeLists.txt b/cpp_src/CMakeLists.txt index 8bfc3150d..c47953a94 100644 --- a/cpp_src/CMakeLists.txt +++ b/cpp_src/CMakeLists.txt @@ -53,25 +53,28 @@ include (TargetArch) target_architecture(COMPILER_TARGET_ARCH) # Configure compile options -string(REPLACE "-DNDEBUG" "" CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS_RELWITHDEBINFO}") -string(REPLACE "-O2" "-O3" CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS}") -string(REPLACE "-O2" "-O3" CMAKE_C_FLAGS "${CMAKE_C_FLAGS}") -if (NOT ${COMPILER_TARGET_ARCH} STREQUAL "e2k") - string(REPLACE "-g" "-g1" CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS_RELWITHDEBINFO}") -else() - string(REPLACE "-g" "-g0" CMAKE_CXX_FLAGS_RELWITHDEBINFO "${CMAKE_CXX_FLAGS_RELWITHDEBINFO}") -endif() - +if (MSVC) + set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "-O2 -g1") + set(CMAKE_C_FLAGS_RELWITHDEBINFO "-O2 -g1") + set(CMAKE_CXX_FLAGS_RELEASE "-O2 -DNDEBUG") + set(CMAKE_C_FLAGS_RELEASE "-O2 -DNDEBUG") +else () + set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "-O3 -g1") + set(CMAKE_C_FLAGS_RELWITHDEBINFO "-O3 -g1") + set(CMAKE_CXX_FLAGS_RELEASE "-O3 -DNDEBUG") + set(CMAKE_C_FLAGS_RELEASE "-O3 -DNDEBUG") +endif () if (${COMPILER_TARGET_ARCH} STREQUAL "e2k") + set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "-O3 -g0") add_definitions(-D__E2K__) add_definitions(-D__LCC__) -endif() +endif () if (NOT MSVC AND NOT APPLE) check_linker_flag (-gz cxx_linker_supports_gz) if (cxx_linker_supports_gz) - set (CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO "${CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO} -gz") - endif () + set (CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO "${CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO} -gz") + endif () endif () if (MSVC) diff --git a/cpp_src/cmd/reindexer_server/test/test_storage_compatibility.sh b/cpp_src/cmd/reindexer_server/test/test_storage_compatibility.sh new file mode 100755 index 000000000..d189d3841 --- /dev/null +++ b/cpp_src/cmd/reindexer_server/test/test_storage_compatibility.sh @@ -0,0 +1,195 @@ +#!/bin/bash +# Task: https://github.com/restream/reindexer/-/issues/1188 +set -e + +function KillAndRemoveServer { + local pid=$1 + kill $pid + wait $pid + yum remove -y 'reindexer*' > /dev/null +} + +function WaitForDB { + # wait until DB is loaded + set +e # disable "exit on error" so the script won't stop when DB's not loaded yet + is_connected=$(reindexer_tool --dsn $ADDRESS --command '\databases list'); + while [[ $is_connected != "test" ]] + do + sleep 2 + is_connected=$(reindexer_tool --dsn $ADDRESS --command '\databases list'); + done + set -e +} + +function CompareNamespacesLists { + local ns_list_actual=$1 + local ns_list_expected=$2 + local pid=$3 + + diff=$(echo ${ns_list_actual[@]} ${ns_list_expected[@]} | tr ' ' '\n' | sort | uniq -u) # compare in any order + if [ "$diff" == "" ]; then + echo "## PASS: namespaces list not changed" + else + echo "##### FAIL: namespaces list was changed" + echo "expected: $ns_list_expected" + echo "actual: $ns_list_actual" + KillAndRemoveServer $pid; + exit 1 + fi +} + +function CompareMemstats { + local actual=$1 + local expected=$2 + local pid=$3 + diff=$(echo ${actual[@]} ${expected[@]} | tr ' ' '\n' | sed 's/\(.*\),$/\1/' | sort | uniq -u) # compare in any order + if [ "$diff" == "" ]; then + echo "## PASS: memstats not changed" + else + echo "##### FAIL: memstats was changed" + echo "expected: $expected" + echo "actual: $actual" + KillAndRemoveServer $pid; + exit 1 + fi +} + + +RX_SERVER_CURRENT_VERSION_RPM="$(basename build/reindexer-*server*.rpm)" +VERSION_FROM_RPM=$(echo "$RX_SERVER_CURRENT_VERSION_RPM" | grep -o '.*server-..') +VERSION=$(echo ${VERSION_FROM_RPM: -2:1}) # one-digit version + +echo "## choose latest release rpm file" +if [ $VERSION == 3 ]; then + LATEST_RELEASE=$(python3 cpp_src/cmd/reindexer_server/test/get_last_rx_version.py -v 3) + namespaces_list_expected=$'purchase_options_ext_dict\nchild_account_recommendations\n#config\n#activitystats\nradio_channels\ncollections\n#namespaces\nwp_imports_tasks\nepg_genres\nrecom_media_items_personal\nrecom_epg_archive_default\n#perfstats\nrecom_epg_live_default\nmedia_view_templates\nasset_video_servers\nwp_tasks_schedule\nadmin_roles\n#clientsstats\nrecom_epg_archive_personal\nrecom_media_items_similars\nmenu_items\naccount_recommendations\nkaraoke_items\nmedia_items\nbanners\n#queriesperfstats\nrecom_media_items_default\nrecom_epg_live_personal\nservices\n#memstats\nchannels\nmedia_item_recommendations\nwp_tasks_tasks\nepg' +elif [ $VERSION == 4 ]; then + LATEST_RELEASE=$(python3 cpp_src/cmd/reindexer_server/test/get_last_rx_version.py -v 4) + # replicationstats ns added for v4 + namespaces_list_expected=$'purchase_options_ext_dict\nchild_account_recommendations\n#config\n#activitystats\n#replicationstats\nradio_channels\ncollections\n#namespaces\nwp_imports_tasks\nepg_genres\nrecom_media_items_personal\nrecom_epg_archive_default\n#perfstats\nrecom_epg_live_default\nmedia_view_templates\nasset_video_servers\nwp_tasks_schedule\nadmin_roles\n#clientsstats\nrecom_epg_archive_personal\nrecom_media_items_similars\nmenu_items\naccount_recommendations\nkaraoke_items\nmedia_items\nbanners\n#queriesperfstats\nrecom_media_items_default\nrecom_epg_live_personal\nservices\n#memstats\nchannels\nmedia_item_recommendations\nwp_tasks_tasks\nepg' +else + echo "Unknown version" + exit 1 +fi + +echo "## downloading latest release rpm file: $LATEST_RELEASE" +curl "http://repo.itv.restr.im/itv-api-ng/7/x86_64/$LATEST_RELEASE" --output $LATEST_RELEASE; +echo "## downloading example DB" +curl "https://git.restream.ru/MaksimKravchuk/reindexer_testdata/-/raw/master/big.zip" --output big.zip; +unzip -o big.zip # unzips into mydb_big.rxdump; + +ADDRESS="cproto://127.0.0.1:6534/" +DB_NAME="test" + +memstats_expected=$'[ +{"replication":{"data_hash":24651210926,"data_count":3}}, +{"replication":{"data_hash":6252344969,"data_count":1}}, +{"replication":{"data_hash":37734732881,"data_count":28}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":1024095024522,"data_count":1145}}, +{"replication":{"data_hash":8373644068,"data_count":1315}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":7404222244,"data_count":97}}, +{"replication":{"data_hash":94132837196,"data_count":4}}, +{"replication":{"data_hash":1896088071,"data_count":2}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":-672103903,"data_count":33538}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":6833710705,"data_count":1}}, +{"replication":{"data_hash":5858155773472,"data_count":4500}}, +{"replication":{"data_hash":-473221280268823592,"data_count":65448}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":8288213744,"data_count":3}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":0,"data_count":0}}, +{"replication":{"data_hash":354171024786967,"data_count":3941}}, +{"replication":{"data_hash":-6520334670,"data_count":35886}}, +{"replication":{"data_hash":112772074632,"data_count":281}}, +{"replication":{"data_hash":-12679568198538,"data_count":1623116}} +] +Returned 27 rows' + +echo "##### Forward compatibility test #####" + +DB_PATH=$(pwd)"/rx_db" + +echo "Database: "$DB_PATH + +echo "## installing latest release: $LATEST_RELEASE" +yum install -y $LATEST_RELEASE > /dev/null; +# run RX server with disabled logging +reindexer_server -l warning --httplog=none --rpclog=none --db $DB_PATH & +server_pid=$! +sleep 2; + +reindexer_tool --dsn $ADDRESS$DB_NAME -f mydb_big.rxdump --createdb; +sleep 1; + +namespaces_1=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command '\namespaces list'); +echo $namespaces_1; +CompareNamespacesLists "${namespaces_1[@]}" "${namespaces_list_expected[@]}" $server_pid; + +memstats_1=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command 'select replication.data_hash, replication.data_count from #memstats'); +CompareMemstats "${memstats_1[@]}" "${memstats_expected[@]}" $server_pid; + +KillAndRemoveServer $server_pid; + +echo "## installing current version: $RX_SERVER_CURRENT_VERSION_RPM" +yum install -y build/*.rpm > /dev/null; +reindexer_server -l0 --corelog=none --httplog=none --rpclog=none --db $DB_PATH & +server_pid=$! +sleep 2; + +WaitForDB + +namespaces_2=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command '\namespaces list'); +echo $namespaces_2; +CompareNamespacesLists "${namespaces_2[@]}" "${namespaces_1[@]}" $server_pid; + +memstats_2=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command 'select replication.data_hash, replication.data_count from #memstats'); +CompareMemstats "${memstats_2[@]}" "${memstats_1[@]}" $server_pid; + +KillAndRemoveServer $server_pid; +rm -rf $DB_PATH; +sleep 1; + +echo "##### Backward compatibility test #####" + +echo "## installing current version: $RX_SERVER_CURRENT_VERSION_RPM" +yum install -y build/*.rpm > /dev/null; +reindexer_server -l warning --httplog=none --rpclog=none --db $DB_PATH & +server_pid=$! +sleep 2; + +reindexer_tool --dsn $ADDRESS$DB_NAME -f mydb_big.rxdump --createdb; +sleep 1; + +namespaces_3=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command '\namespaces list'); +echo $namespaces_3; +CompareNamespacesLists "${namespaces_3[@]}" "${namespaces_list_expected[@]}" $server_pid; + +memstats_3=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command 'select replication.data_hash, replication.data_count from #memstats'); +CompareMemstats "${memstats_3[@]}" "${memstats_expected[@]}" $server_pid; + +KillAndRemoveServer $server_pid; + +echo "## installing latest release: $LATEST_RELEASE" +yum install -y $LATEST_RELEASE > /dev/null; +reindexer_server -l warning --httplog=none --rpclog=none --db $DB_PATH & +server_pid=$! +sleep 2; + +WaitForDB + +namespaces_4=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command '\namespaces list'); +echo $namespaces_4; +CompareNamespacesLists "${namespaces_4[@]}" "${namespaces_3[@]}" $server_pid; + +memstats_4=$(reindexer_tool --dsn $ADDRESS$DB_NAME --command 'select replication.data_hash, replication.data_count from #memstats'); +CompareMemstats "${memstats_4[@]}" "${memstats_3[@]}" $server_pid; + +KillAndRemoveServer $server_pid; +rm -rf $DB_PATH; diff --git a/cpp_src/cmd/reindexer_tool/commandsexecutor.cc b/cpp_src/cmd/reindexer_tool/commandsexecutor.cc index 77c3abb70..1b5853d70 100644 --- a/cpp_src/cmd/reindexer_tool/commandsexecutor.cc +++ b/cpp_src/cmd/reindexer_tool/commandsexecutor.cc @@ -191,7 +191,43 @@ Error CommandsExecutor::runImpl(const std::string& dsn, Args&&... a using reindexer::net::ev::sig; assertrx(!executorThr_.joinable()); - auto fn = [this](const std::string& dsn, Args&&... args) { + auto fnLoop = [this](const std::string& dsn, Args&&... args) { + std::string outputMode; + Error err; + if (reindexer::fs::ReadFile(reindexer::fs::JoinPath(reindexer::fs::GetHomeDir(), kConfigFile), outputMode) > 0) { + try { + gason::JsonParser jsonParser; + gason::JsonNode value = jsonParser.Parse(reindexer::giftStr(outputMode)); + for (auto node : value) { + WrSerializer ser; + reindexer::jsonValueToString(node.value, ser, 0, 0, false); + variables_[kVariableOutput] = std::string(ser.Slice()); + } + } catch (const gason::Exception& e) { + err = Error(errParseJson, "Unable to parse output mode: %s", e.what()); + } + } + if (err.ok() && variables_.empty()) { + variables_[kVariableOutput] = kOutputModeJson; + } + if (err.ok() && !uri_.parse(dsn)) { + err = Error(errNotValid, "Cannot connect to DB: Not a valid uri"); + } + if (err.ok()) err = db().Connect(dsn, std::forward(args)...); + if (err.ok()) { + loop_.spawn( + [this] { + // This coroutine should prevent loop from stopping for core::Reindexer + stopCh_.pop(); + }, + k8KStack); + } + std::lock_guard lck(mtx_); + status_.running = err.ok(); + status_.err = std::move(err); + }; + + auto fnThread = [this, &fnLoop](const std::string& dsn, Args&&... args) { sig sint; sint.set(loop_); sint.set([this](sig&) { cancelCtx_.Cancel(); }); @@ -214,49 +250,13 @@ Error CommandsExecutor::runImpl(const std::string& dsn, Args&&... a }); }); cmdAsync_.start(); - - auto fn = [this](const std::string& dsn, Args&&... args) { - std::string outputMode; - Error err; - if (reindexer::fs::ReadFile(reindexer::fs::JoinPath(reindexer::fs::GetHomeDir(), kConfigFile), outputMode) > 0) { - try { - gason::JsonParser jsonParser; - gason::JsonNode value = jsonParser.Parse(reindexer::giftStr(outputMode)); - for (auto node : value) { - WrSerializer ser; - reindexer::jsonValueToString(node.value, ser, 0, 0, false); - variables_[kVariableOutput] = std::string(ser.Slice()); - } - } catch (const gason::Exception& e) { - err = Error(errParseJson, "Unable to parse output mode: %s", e.what()); - } - } - if (err.ok() && variables_.empty()) { - variables_[kVariableOutput] = kOutputModeJson; - } - if (err.ok() && !uri_.parse(dsn)) { - err = Error(errNotValid, "Cannot connect to DB: Not a valid uri"); - } - if (err.ok()) err = db().Connect(dsn, std::forward(args)...); - if (err.ok()) { - loop_.spawn( - [this] { - // This coroutine should prevent loop from stopping for core::Reindexer - stopCh_.pop(); - }, - k8KStack); - } - std::lock_guard lck(mtx_); - status_.running = err.ok(); - status_.err = std::move(err); - }; - loop_.spawn(std::bind(fn, std::cref(dsn), std::forward(args)...)); + loop_.spawn(std::bind(fnLoop, std::cref(dsn), std::forward(args)...)); loop_.run(); }; setStatus(Status()); - executorThr_ = std::thread(std::bind(fn, std::cref(dsn), std::forward(args)...)); + executorThr_ = std::thread(std::bind(fnThread, std::cref(dsn), std::forward(args)...)); auto status = GetStatus(); while (!status.running && status.err.ok()) { std::this_thread::sleep_for(std::chrono::milliseconds(1)); diff --git a/cpp_src/core/defnsconfigs.h b/cpp_src/core/defnsconfigs.h index 04fec8aa3..1601c2b68 100644 --- a/cpp_src/core/defnsconfigs.h +++ b/cpp_src/core/defnsconfigs.h @@ -75,6 +75,7 @@ const std::vector kDefDBConfig = { "replication":{ "role":"none", "master_dsn":"cproto://127.0.0.1:6534/db", + "server_id":0, "cluster_id":2, "force_sync_on_logic_error": false, "force_sync_on_wrong_data_hash": false, diff --git a/cpp_src/core/ft/areaholder.h b/cpp_src/core/ft/areaholder.h index e4db54a9f..fb186f6b0 100644 --- a/cpp_src/core/ft/areaholder.h +++ b/cpp_src/core/ft/areaholder.h @@ -39,7 +39,8 @@ class AreaBuffer { [[nodiscard]] bool Empty() const noexcept { return data_.empty(); } void Commit() { if (!data_.empty()) { - boost::sort::pdqsort(data_.begin(), data_.end(), [](const Area &rhs, const Area &lhs) { return rhs.start < lhs.start; }); + boost::sort::pdqsort_branchless(data_.begin(), data_.end(), + [](const Area &rhs, const Area &lhs) noexcept { return rhs.start < lhs.start; }); for (auto vit = data_.begin() + 1; vit != data_.end(); ++vit) { auto prev = vit - 1; if (vit->Concat(*prev)) { diff --git a/cpp_src/core/ft/ft_fast/selecter.cc b/cpp_src/core/ft/ft_fast/selecter.cc index b460ca929..40082ae17 100644 --- a/cpp_src/core/ft/ft_fast/selecter.cc +++ b/cpp_src/core/ft/ft_fast/selecter.cc @@ -335,8 +335,8 @@ void Selecter::processLowRelVariants(FtSelectContext& ctx, const FtMerge return false; }); } else { - boost::sort::pdqsort(ctx.lowRelVariants.begin(), ctx.lowRelVariants.end(), - [](FtBoundVariantEntry& l, FtBoundVariantEntry& r) noexcept { return l.proc > r.proc; }); + boost::sort::pdqsort_branchless(ctx.lowRelVariants.begin(), ctx.lowRelVariants.end(), + [](FtBoundVariantEntry& l, FtBoundVariantEntry& r) noexcept { return l.proc > r.proc; }); } auto lastVariantLen = ctx.lowRelVariants.size() ? ctx.lowRelVariants[0].GetLenCached() : -1; @@ -790,7 +790,7 @@ std::pair Selecter::calcTermRank(const TextSearchResults& r if (!termRank) return std::make_pair(termRank, field); if (holder_.cfg_->summationRanksByFieldsRatio > 0) { - std::sort(ranksInFields.begin(), ranksInFields.end()); + boost::sort::pdqsort_branchless(ranksInFields.begin(), ranksInFields.end()); double k = holder_.cfg_->summationRanksByFieldsRatio; for (auto rank : ranksInFields) { termRank += (k * rank); @@ -921,9 +921,10 @@ void Selecter::mergeIterationGroup(TextSearchResults& rawRes, index_t ra mergedPosInfo.rank = 0; } else { auto& posTmp = mergedPosInfo.posTmp; - boost::sort::pdqsort( - posTmp.begin(), posTmp.end(), - [](const std::pair& l, const std::pair& r) { return l.first < r.first; }); + boost::sort::pdqsort_branchless(posTmp.begin(), posTmp.end(), + [](const std::pair& l, + const std::pair& r) noexcept { return l.first < r.first; }); + auto last = std::unique(posTmp.begin(), posTmp.end()); posTmp.resize(last - posTmp.begin()); @@ -984,9 +985,9 @@ void Selecter::mergeResultsPart(std::vector& rawResul merged.maxRank = m.proc; } } - - boost::sort::pdqsort(merged.begin(), merged.end(), - [](const IDataHolder::MergeInfo& lhs, const IDataHolder::MergeInfo& rhs) { return lhs.proc > rhs.proc; }); + boost::sort::pdqsort_branchless( + merged.begin(), merged.end(), + [](const IDataHolder::MergeInfo& lhs, const IDataHolder::MergeInfo& rhs) noexcept { return lhs.proc > rhs.proc; }); } template @@ -1244,12 +1245,11 @@ typename IDataHolder::MergeData Selecter::mergeResults(std::vector merged_rd; std::vector idoffsets; - for (auto& rawRes : rawResults) { - boost::sort::pdqsort(rawRes.begin(), rawRes.end(), - [](const TextSearchResult& lhs, const TextSearchResult& rhs) { return lhs.proc_ > rhs.proc_; }); + boost::sort::pdqsort_branchless( + rawRes.begin(), rawRes.end(), + [](const TextSearchResult& lhs, const TextSearchResult& rhs) noexcept { return lhs.proc_ > rhs.proc_; }); } - const auto maxMergedSize = std::min(size_t(holder_.cfg_->mergeLimit), totalORVids); merged.reserve(maxMergedSize); @@ -1332,8 +1332,9 @@ typename IDataHolder::MergeData Selecter::mergeResults(std::vector rhs.proc; }); + boost::sort::pdqsort_branchless( + merged.begin(), merged.end(), + [](const IDataHolder::MergeInfo& lhs, const IDataHolder::MergeInfo& rhs) noexcept { return lhs.proc > rhs.proc; }); return merged; } diff --git a/cpp_src/core/ft/ft_fuzzy/merger/basemerger.cc b/cpp_src/core/ft/ft_fuzzy/merger/basemerger.cc index 967161001..12a57498c 100644 --- a/cpp_src/core/ft/ft_fuzzy/merger/basemerger.cc +++ b/cpp_src/core/ft/ft_fuzzy/merger/basemerger.cc @@ -93,7 +93,7 @@ SearchResult BaseMerger::Merge(MergeCtx& ctx, bool inTransaction, const reindexe data_set.AddData(it->Id(), id_ctx); } } - boost::sort::pdqsort(data_set.data_->begin(), data_set.data_->end(), [](const MergedData& lhs, const MergedData& rhs) { + boost::sort::pdqsort(data_set.data_->begin(), data_set.data_->end(), [](const MergedData& lhs, const MergedData& rhs) noexcept { if (lhs.proc_ == rhs.proc_) { return lhs.id_ < rhs.id_; } diff --git a/cpp_src/core/ft/idrelset.cc b/cpp_src/core/ft/idrelset.cc index 7f31546d1..6b87bc15c 100644 --- a/cpp_src/core/ft/idrelset.cc +++ b/cpp_src/core/ft/idrelset.cc @@ -1,4 +1,3 @@ - #include "idrelset.h" #include #include "estl/h_vector.h" @@ -84,9 +83,4 @@ int IdRelSet::Add(VDocIdType id, int pos, int field) { return back().Size(); } -void IdRelType::SimpleCommit() { - boost::sort::pdqsort(pos_.begin(), pos_.end(), - [](const IdRelType::PosType& lhs, const IdRelType::PosType& rhs) { return lhs.pos() < rhs.pos(); }); -} - } // namespace reindexer diff --git a/cpp_src/core/ft/idrelset.h b/cpp_src/core/ft/idrelset.h index 05ea5f8b7..23bc811fa 100644 --- a/cpp_src/core/ft/idrelset.h +++ b/cpp_src/core/ft/idrelset.h @@ -102,11 +102,11 @@ class IdRelType { addField(field); } void SortAndUnique() { - boost::sort::pdqsort(pos_.begin(), pos_.end()); + boost::sort::pdqsort_branchless(pos_.begin(), pos_.end()); auto last = std::unique(pos_.begin(), pos_.end()); pos_.resize(last - pos_.begin()); } - void Clear() { + void Clear() noexcept { usedFieldsMask_ = 0; #ifdef REINDEXER_FT_EXTRA_DEBUG pos_.clear(); @@ -116,7 +116,11 @@ class IdRelType { } size_t Size() const noexcept { return pos_.size(); } size_t size() const noexcept { return pos_.size(); } - void SimpleCommit(); + void SimpleCommit() noexcept { + boost::sort::pdqsort_branchless( + pos_.begin(), pos_.end(), + [](const IdRelType::PosType& lhs, const IdRelType::PosType& rhs) noexcept { return lhs.pos() < rhs.pos(); }); + } const RVector& Pos() const noexcept { return pos_; } uint64_t UsedFieldsMask() const noexcept { return usedFieldsMask_; } size_t HeapSize() const noexcept { return heapSize(pos_); } @@ -141,7 +145,7 @@ class IdRelType { class IdRelSet : public std::vector { public: int Add(VDocIdType id, int pos, int field); - void SimpleCommit() { + void SimpleCommit() noexcept { for (auto& val : *this) val.SimpleCommit(); } diff --git a/cpp_src/core/idset.h b/cpp_src/core/idset.h index 81522fcef..e2e501c00 100644 --- a/cpp_src/core/idset.h +++ b/cpp_src/core/idset.h @@ -108,7 +108,7 @@ class IdSet : public IdSetPlain { return *this; } static Ptr BuildFromUnsorted(base_idset &&ids) { - boost::sort::pdqsort(ids.begin(), ids.end()); + boost::sort::pdqsort_branchless(ids.begin(), ids.end()); ids.erase(std::unique(ids.begin(), ids.end()), ids.end()); // TODO: It would be better to integrate unique into sort return make_intrusive>(std::move(ids)); } diff --git a/cpp_src/core/index/indextext/fastindextext.cc b/cpp_src/core/index/indextext/fastindextext.cc index 12cbdcae9..c56dc44b8 100644 --- a/cpp_src/core/index/indextext/fastindextext.cc +++ b/cpp_src/core/index/indextext/fastindextext.cc @@ -123,7 +123,7 @@ template IndexMemStat FastIndexText::GetMemStat(const RdxContext &ctx) { auto ret = IndexUnordered::GetMemStat(ctx); - contexted_shared_lock lck(this->mtx_, &ctx); + contexted_shared_lock lck(this->mtx_, ctx); ret.fulltextSize = this->holder_->GetMemStat(); ret.idsetCache = this->cache_ft_ ? this->cache_ft_->GetMemStat() : LRUCacheMemStat(); return ret; diff --git a/cpp_src/core/index/keyentry.h b/cpp_src/core/index/keyentry.h index 079f543c6..9c500dba1 100644 --- a/cpp_src/core/index/keyentry.h +++ b/cpp_src/core/index/keyentry.h @@ -33,12 +33,14 @@ class KeyEntry { auto idsAsc = Sorted(ctx.getCurSortId()); size_t idx = 0; + const auto& ids2Sorts = ctx.ids2Sorts(); + [[maybe_unused]] const IdType maxRowId = IdType(ids2Sorts.size()); // For all ids of current key for (auto rowid : ids_) { - assertf(rowid < int(ctx.ids2Sorts().size()), "id=%d,ctx.ids2Sorts().size()=%d", rowid, ctx.ids2Sorts().size()); - idsAsc[idx++] = ctx.ids2Sorts()[rowid]; + assertf(rowid < maxRowId, "id=%d,ctx.ids2Sorts().size()=%d", rowid, maxRowId); + idsAsc[idx++] = ids2Sorts[rowid]; } - boost::sort::pdqsort(idsAsc.begin(), idsAsc.end()); + boost::sort::pdqsort_branchless(idsAsc.begin(), idsAsc.end()); } void Dump(std::ostream& os, std::string_view step, std::string_view offset) const { std::string newOffset; diff --git a/cpp_src/core/index/rtree/greenesplitter.h b/cpp_src/core/index/rtree/greenesplitter.h index ba707e781..c8c6a7179 100644 --- a/cpp_src/core/index/rtree/greenesplitter.h +++ b/cpp_src/core/index/rtree/greenesplitter.h @@ -1,6 +1,7 @@ #pragma once #include "splitter.h" +#include "vendor/sort/pdqsort.hpp" namespace reindexer { @@ -53,7 +54,7 @@ class GreeneSplitter : private Splitter secondSeedBoundRect.Left() + secondSeedBoundRect.Right()) { std::swap(seeds.first, seeds.second); } - std::sort(std::begin(indexes), std::end(indexes), [&src, this](size_t lhs, size_t rhs) { + boost::sort::pdqsort(std::begin(indexes), std::end(indexes), [&src, this](size_t lhs, size_t rhs) { return Base::getBoundRect(lhs < MaxEntries ? src[lhs] : this->appendingEntry_).Left() < Base::getBoundRect(rhs < MaxEntries ? src[rhs] : this->appendingEntry_).Left(); }); @@ -61,7 +62,7 @@ class GreeneSplitter : private Splitter secondSeedBoundRect.Bottom() + secondSeedBoundRect.Top()) { std::swap(seeds.first, seeds.second); } - std::sort(std::begin(indexes), std::end(indexes), [&src, this](size_t lhs, size_t rhs) { + boost::sort::pdqsort(std::begin(indexes), std::end(indexes), [&src, this](size_t lhs, size_t rhs) { return Base::getBoundRect(lhs < MaxEntries ? src[lhs] : this->appendingEntry_).Bottom() < Base::getBoundRect(rhs < MaxEntries ? src[rhs] : this->appendingEntry_).Bottom(); }); diff --git a/cpp_src/core/index/rtree/rstarsplitter.h b/cpp_src/core/index/rtree/rstarsplitter.h index a44c9748e..427a4add3 100644 --- a/cpp_src/core/index/rtree/rstarsplitter.h +++ b/cpp_src/core/index/rtree/rstarsplitter.h @@ -1,6 +1,7 @@ #pragma once #include "splitter.h" +#include "vendor/sort/pdqsort.hpp" namespace reindexer { @@ -19,12 +20,12 @@ class RStarSplitter : private Splitter diff --git a/cpp_src/core/lsn.cc b/cpp_src/core/lsn.cc index dc88fb059..73c0130e2 100644 --- a/cpp_src/core/lsn.cc +++ b/cpp_src/core/lsn.cc @@ -3,9 +3,11 @@ namespace reindexer { -void lsn_t::GetJSON(JsonBuilder &builder) const { +void lsn_t::GetJSON(JsonBuilder& builder) const { builder.Put("server_id", Server()); builder.Put("counter", Counter()); } -} // namespace reindexer +[[noreturn]] void lsn_t::throwValidation(ErrorCode code, const char* fmt, int64_t value) { throw Error(code, fmt, value); } + +} // namespace reindexer \ No newline at end of file diff --git a/cpp_src/core/lsn.h b/cpp_src/core/lsn.h index eb1f83d15..174540da4 100644 --- a/cpp_src/core/lsn.h +++ b/cpp_src/core/lsn.h @@ -13,58 +13,53 @@ class JsonBuilder; // SSS NNN NNN NNN NNN NNN (18 decimal digits) struct lsn_t { - static const int64_t digitCountLSNMult = 1000000000000000ll; +private: + static constexpr int16_t kMinServerIDValue = 0; + static constexpr int16_t kMaxServerIDValue = 999; - static const int64_t kCounterbitCount = 48; - static const int64_t kCounterMask = (1ull << kCounterbitCount) - 1ull; + static constexpr int64_t kMaxCounter = 1000000000000000ll; + static constexpr int64_t kDefaultCounter = kMaxCounter - 1; +public: void GetJSON(JsonBuilder &builder) const; void FromJSON(const gason::JsonNode &root) { - int server = root["server_id"].As(0); - int64_t counter = root["counter"].As(digitCountLSNMult - 1ll); + const int server = root["server_id"].As(0); + const int64_t counter = root["counter"].As(kDefaultCounter); payload_ = int64_t(lsn_t(counter, server)); } - lsn_t() {} - explicit lsn_t(int64_t v) { - if ((v & kCounterMask) == kCounterMask) // init -1 - payload_ = digitCountLSNMult - 1ll; - else { - payload_ = v; - } - } - lsn_t(int64_t counter, uint8_t server) { - if ((counter & kCounterMask) == kCounterMask) counter = digitCountLSNMult - 1ll; - int64_t s = server * digitCountLSNMult; - payload_ = s + counter; + lsn_t() noexcept = default; + lsn_t(const lsn_t &) noexcept = default; + lsn_t(lsn_t &&) noexcept = default; + lsn_t &operator=(const lsn_t &) noexcept = default; + lsn_t &operator=(lsn_t &&) noexcept = default; + explicit lsn_t(int64_t v) : lsn_t(v % kMaxCounter, v / kMaxCounter) {} + lsn_t(int64_t counter, int16_t server) { + validateCounter(counter); + validateServerId(server); + payload_ = server * kMaxCounter + counter; } explicit operator int64_t() const { return payload_; } - bool operator==(lsn_t o) { return payload_ == o.payload_; } - bool operator!=(lsn_t o) { return payload_ != o.payload_; } + bool operator==(lsn_t o) const noexcept { return payload_ == o.payload_; } + bool operator!=(lsn_t o) const noexcept { return payload_ != o.payload_; } - int64_t SetServer(short s) { - if (s > 999) throw Error(errLogic, "Server id > 999"); - int64_t server = s * digitCountLSNMult; - int64_t serverOld = payload_ / digitCountLSNMult; - payload_ = payload_ - serverOld * digitCountLSNMult + server; + int64_t SetServer(short server) { + validateServerId(server); + payload_ = server * kMaxCounter + Counter(); return payload_; } - int64_t SetCounter(int64_t c) { - if (c >= digitCountLSNMult) throw Error(errLogic, "LSN Counter > digitCountLSNMult"); - int64_t server = payload_ / digitCountLSNMult; - payload_ = server * digitCountLSNMult + c; + int64_t SetCounter(int64_t counter) { + validateCounter(counter); + payload_ = Server() * kMaxCounter + counter; return payload_; } - int64_t Counter() const { - int64_t server = payload_ / digitCountLSNMult; - return payload_ - server * digitCountLSNMult; - } - short Server() const { return payload_ / digitCountLSNMult; } - bool isEmpty() const { return Counter() == digitCountLSNMult - 1ll; } + int64_t Counter() const noexcept { return payload_ % kMaxCounter; } + int16_t Server() const noexcept { return payload_ / kMaxCounter; } + bool isEmpty() const noexcept { return Counter() == kDefaultCounter; } - int compare(lsn_t o) { + int compare(lsn_t o) const { if (Server() != o.Server()) throw Error(errLogic, "Compare lsn from different server"); if (Counter() < o.Counter()) return -1; @@ -73,13 +68,28 @@ struct lsn_t { return 0; } - bool operator<(lsn_t o) { return compare(o) == -1; } - bool operator<=(lsn_t o) { return compare(o) <= 0; } - bool operator>(lsn_t o) { return compare(o) == 1; } - bool operator>=(lsn_t o) { return compare(o) >= 0; } + bool operator<(lsn_t o) const { return compare(o) == -1; } + bool operator<=(lsn_t o) const { return compare(o) <= 0; } + bool operator>(lsn_t o) const { return compare(o) == 1; } + bool operator>=(lsn_t o) const { return compare(o) >= 0; } + +private: + int64_t payload_ = kDefaultCounter; + static void validateServerId(int16_t server) { + if (server < kMinServerIDValue) { + throwValidation(errLogic, "Server id < %d", kMinServerIDValue); + } + if (server > kMaxServerIDValue) { + throwValidation(errLogic, "Server id > %d", kMaxServerIDValue); + } + } + static void validateCounter(int64_t counter) { + if (counter > kDefaultCounter) { + throwValidation(errLogic, "LSN Counter > Default LSN (%d)", kMaxCounter); + } + } -protected: - int64_t payload_ = digitCountLSNMult - 1ll; + [[noreturn]] static void throwValidation(ErrorCode, const char *, int64_t); }; struct LSNPair { diff --git a/cpp_src/core/namespace/namespace.cc b/cpp_src/core/namespace/namespace.cc index 733bb309e..dbf0cc362 100644 --- a/cpp_src/core/namespace/namespace.cc +++ b/cpp_src/core/namespace/namespace.cc @@ -23,7 +23,7 @@ void Namespace::CommitTransaction(Transaction& tx, QueryResults& result, const R if (needNamespaceCopy(nsl, tx)) { PerfStatCalculatorMT calc(nsl->updatePerfCounter_, enablePerfCounters); - auto lck = statCalculator.CreateLock(clonerMtx_, &ctx); + auto lck = statCalculator.CreateLock(clonerMtx_, ctx); nsl = ns_; if (needNamespaceCopy(nsl, tx)) { diff --git a/cpp_src/core/namespace/namespace.h b/cpp_src/core/namespace/namespace.h index 55dc59548..710beea52 100644 --- a/cpp_src/core/namespace/namespace.h +++ b/cpp_src/core/namespace/namespace.h @@ -160,7 +160,7 @@ class Namespace { NamespaceImpl::Ptr getMainNs() const { return atomicLoadMainNs(); } NamespaceImpl::Ptr awaitMainNs(const RdxContext &ctx) const { if (hasCopy_.load(std::memory_order_acquire)) { - contexted_unique_lock lck(clonerMtx_, &ctx); + contexted_unique_lock lck(clonerMtx_, ctx); assertrx(!hasCopy_.load(std::memory_order_acquire)); return ns_; } diff --git a/cpp_src/core/namespace/namespaceimpl.h b/cpp_src/core/namespace/namespaceimpl.h index 31a6e8fb4..b09d79486 100644 --- a/cpp_src/core/namespace/namespaceimpl.h +++ b/cpp_src/core/namespace/namespaceimpl.h @@ -138,7 +138,7 @@ class NamespaceImpl : public intrusive_atomic_rc_base { // NOLINT(*performance. friend class ItemsLoader; friend class IndexInserters; - class NSUpdateSortedContext : public UpdateSortedContext { + class NSUpdateSortedContext final : public UpdateSortedContext { public: NSUpdateSortedContext(const NamespaceImpl &ns, SortType curSortId) : ns_(ns), sorted_indexes_(ns_.getSortedIdxCount()), curSortId_(curSortId) { @@ -303,10 +303,10 @@ class NamespaceImpl : public intrusive_atomic_rc_base { // NOLINT(*performance. typedef contexted_shared_lock RLockT; typedef contexted_unique_lock WLockT; - RLockT RLock(const RdxContext &ctx) const { return RLockT(mtx_, &ctx); } + RLockT RLock(const RdxContext &ctx) const { return RLockT(mtx_, ctx); } WLockT WLock(const RdxContext &ctx) const { using namespace std::string_view_literals; - WLockT lck(mtx_, &ctx); + WLockT lck(mtx_, ctx); if (readonly_.load(std::memory_order_acquire)) { throw Error(errNamespaceInvalidated, "NS invalidated"sv); } diff --git a/cpp_src/core/nsselecter/querypreprocessor.cc b/cpp_src/core/nsselecter/querypreprocessor.cc index 6070eb478..6697aad44 100644 --- a/cpp_src/core/nsselecter/querypreprocessor.cc +++ b/cpp_src/core/nsselecter/querypreprocessor.cc @@ -501,7 +501,7 @@ bool QueryPreprocessor::mergeQueryEntries(size_t lhs, size_t rhs) { constexpr size_t kMinArraySizeToUseHashSet = 250; if (second.size() < kMinArraySizeToUseHashSet) { // Intersect via binary search + sort for small vectors - std::sort(first.begin(), first.end()); + boost::sort::pdqsort(first.begin(), first.end()); for (auto &&v : second) { if (std::binary_search(first.begin(), first.end(), v)) { setValues.emplace_back(std::move(v)); diff --git a/cpp_src/core/reindexerimpl.cc b/cpp_src/core/reindexerimpl.cc index 59e1f48bd..5b1040f6c 100644 --- a/cpp_src/core/reindexerimpl.cc +++ b/cpp_src/core/reindexerimpl.cc @@ -96,7 +96,7 @@ ReindexerImpl::StatsLocker::StatsLocker() { ReindexerImpl::StatsLocker::StatsLockT ReindexerImpl::StatsLocker::LockIfRequired(std::string_view sysNsName, const RdxContext& ctx) { auto found = mtxMap_.find(sysNsName); if (found != mtxMap_.end()) { - return StatsLockT(found->second, &ctx); + return StatsLockT(found->second, ctx); } // Do not create any lock, if namespace does not preset in the map return StatsLockT(); @@ -231,8 +231,9 @@ Error ReindexerImpl::Connect(const std::string& dsn, ConnectOpts opts) { if (!err.ok()) return err; if (enableStorage && opts.IsOpenNamespaces()) { - std::sort(foundNs.begin(), foundNs.end(), - [](const fs::DirEntry& ld, const fs::DirEntry& rd) { return ld.internalFilesCount > rd.internalFilesCount; }); + boost::sort::pdqsort_branchless(foundNs.begin(), foundNs.end(), [](const fs::DirEntry& ld, const fs::DirEntry& rd) noexcept { + return ld.internalFilesCount > rd.internalFilesCount; + }); const size_t maxLoadWorkers = ConcurrentNamespaceLoaders(); std::unique_ptr thrs(new std::thread[maxLoadWorkers]); std::atomic_flag hasNsErrors = ATOMIC_FLAG_INIT; @@ -303,7 +304,7 @@ Error ReindexerImpl::OpenNamespace(std::string_view nsName, const StorageOpts& o const auto rdxCtx = ctx.CreateRdxContext(ctx.NeedTraceActivity() ? (ser << "OPEN NAMESPACE " << nsName).Slice() : ""sv, activities_); { - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); auto it = namespaces_.find(nsName); if (it == namespaces_.end()) { // create new namespace if (!validateUserNsName(nsName)) { @@ -335,7 +336,7 @@ Error ReindexerImpl::addNamespace(const NamespaceDef& nsDef, const RdxContext& r Namespace::Ptr ns; try { { - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); if (namespaces_.find(nsDef.name) != namespaces_.end()) { return Error(errParams, "Namespace '%s' already exists", nsDef.name); } @@ -356,7 +357,7 @@ Error ReindexerImpl::addNamespace(const NamespaceDef& nsDef, const RdxContext& r ns->LoadFromStorage(kStorageLoadingThreads, rdxCtx); } { - ULock lock(mtx_, &rdxCtx); + ULock lock(mtx_, rdxCtx); namespaces_.insert({nsDef.name, ns}); } if (!nsDef.isTemporary) observers_.OnWALUpdate(LSNPair(), nsDef.name, WALRecord(WalNamespaceAdd)); @@ -376,7 +377,7 @@ Error ReindexerImpl::addNamespace(const NamespaceDef& nsDef, const RdxContext& r Error ReindexerImpl::openNamespace(std::string_view name, const StorageOpts& storageOpts, const RdxContext& rdxCtx) { try { { - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); auto nsIt = namespaces_.find(name); if (nsIt != namespaces_.end() && nsIt->second) { if (storageOpts.IsSlaveMode()) nsIt->second->setSlaveMode(rdxCtx); @@ -426,7 +427,7 @@ Error ReindexerImpl::closeNamespace(std::string_view nsName, const RdxContext& c Namespace::Ptr ns; Error err; try { - ULock lock(mtx_, &ctx); + ULock lock(mtx_, ctx); auto nsIt = namespaces_.find(nsName); if (nsIt == namespaces_.end()) { return Error(errNotFound, "Namespace '%s' does not exist", nsName); @@ -498,7 +499,7 @@ Error ReindexerImpl::RenameNamespace(std::string_view srcNsName, const std::stri const auto rdxCtx = ctx.CreateRdxContext( ctx.NeedTraceActivity() ? (ser << "RENAME " << srcNsName << " to " << dstNsName).Slice() : ""sv, activities_); { - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); auto srcIt = namespaces_.find(srcNsName); if (srcIt == namespaces_.end()) { return Error(errParams, "Namespace '%s' doesn't exist", srcNsName); @@ -540,7 +541,7 @@ Error ReindexerImpl::renameNamespace(std::string_view srcNsName, const std::stri { // Perform namespace flushes to minimize chances of the flush under lock - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); auto srcIt = namespaces_.find(srcNsName); srcNs = (srcIt != namespaces_.end()) ? srcIt->second : Namespace::Ptr(); lock.unlock(); @@ -554,7 +555,7 @@ Error ReindexerImpl::renameNamespace(std::string_view srcNsName, const std::stri } } - ULock lock(mtx_, &rdxCtx); + ULock lock(mtx_, rdxCtx); auto srcIt = namespaces_.find(srcNsName); if (srcIt == namespaces_.end()) { return Error(errParams, "Namespace '%s' doesn't exist", srcNsName); @@ -837,7 +838,7 @@ Error ReindexerImpl::Select(std::string_view query, QueryResults& result, const } struct ItemRefLess { - bool operator()(const ItemRef& lhs, const ItemRef& rhs) const { + bool operator()(const ItemRef& lhs, const ItemRef& rhs) const noexcept { if (lhs.Proc() == rhs.Proc()) { if (lhs.Nsid() == rhs.Nsid()) { return lhs.Id() < rhs.Id(); @@ -1200,7 +1201,7 @@ void ReindexerImpl::doSelect(const Query& q, QueryResults& result, NsLocker& result.Erase(itemRefVec.begin(), itemRefVec.end()); return; } - std::sort(itemRefVec.begin(), itemRefVec.end(), ItemRefLess()); + boost::sort::pdqsort(itemRefVec.begin(), itemRefVec.end(), ItemRefLess()); if (q.HasOffset()) { result.Erase(itemRefVec.begin(), itemRefVec.begin() + q.Offset()); } @@ -1224,7 +1225,7 @@ Error ReindexerImpl::Commit(std::string_view /*_namespace*/) { } Namespace::Ptr ReindexerImpl::getNamespace(std::string_view nsName, const RdxContext& ctx) { - SLock lock(mtx_, &ctx); + SLock lock(mtx_, ctx); auto nsIt = namespaces_.find(nsName); if (nsIt == namespaces_.end()) { throw Error(errParams, "Namespace '%s' does not exist", nsName); @@ -1235,7 +1236,7 @@ Namespace::Ptr ReindexerImpl::getNamespace(std::string_view nsName, const RdxCon } Namespace::Ptr ReindexerImpl::getNamespaceNoThrow(std::string_view nsName, const RdxContext& ctx) { - SLock lock(mtx_, &ctx); + SLock lock(mtx_, ctx); auto nsIt = namespaces_.find(nsName); return (nsIt == namespaces_.end()) ? nullptr : nsIt->second; } @@ -1279,7 +1280,7 @@ Error ReindexerImpl::DropIndex(std::string_view nsName, const IndexDef& indexDef } std::vector> ReindexerImpl::getNamespaces(const RdxContext& ctx) { - SLock lock(mtx_, &ctx); + SLock lock(mtx_, ctx); std::vector> ret; ret.reserve(namespaces_.size()); for (auto& ns : namespaces_) { @@ -1290,7 +1291,7 @@ std::vector> ReindexerImpl::getNamespaces std::vector ReindexerImpl::getNamespacesNames(const RdxContext& ctx) { std::vector ret; - SLock lock(mtx_, &ctx); + SLock lock(mtx_, ctx); ret.reserve(namespaces_.size()); for (auto& ns : namespaces_) { ret.emplace_back(); @@ -1322,7 +1323,7 @@ Error ReindexerImpl::EnumNamespaces(std::vector& defs, EnumNamespa for (auto& d : dirs) { if (d.isDir && d.name != "." && d.name != ".." && opts.MatchFilter(d.name)) { { - SLock lock(mtx_, &rdxCtx); + SLock lock(mtx_, rdxCtx); if (namespaces_.find(d.name) != namespaces_.end()) continue; } std::unique_ptr tmpNs{new NamespaceImpl(d.name, observers_)}; diff --git a/cpp_src/core/reindexerimpl.h b/cpp_src/core/reindexerimpl.h index f8ef5736d..d5ff74fbd 100644 --- a/cpp_src/core/reindexerimpl.h +++ b/cpp_src/core/reindexerimpl.h @@ -31,7 +31,7 @@ class ReindexerImpl { using Mutex = MarkedMutex; using StatsSelectMutex = MarkedMutex; struct NsLockerItem { - NsLockerItem(NamespaceImpl::Ptr ins = {}) : ns(std::move(ins)), count(1) {} + NsLockerItem(NamespaceImpl::Ptr ins = {}) noexcept : ns(std::move(ins)), count(1) {} NamespaceImpl::Ptr ns; NamespaceImpl::Locker::RLockT nsLck; unsigned count = 1; @@ -144,8 +144,9 @@ class ReindexerImpl { assertrx(0); } void Lock() { - std::sort(begin(), end(), [](const NsLockerItem &lhs, const NsLockerItem &rhs) { return lhs.ns.get() < rhs.ns.get(); }); - for (auto it = begin(); it != end(); ++it) { + boost::sort::pdqsort_branchless( + begin(), end(), [](const NsLockerItem &lhs, const NsLockerItem &rhs) noexcept { return lhs.ns.get() < rhs.ns.get(); }); + for (auto it = begin(), e = end(); it != e; ++it) { it->nsLck = it->ns->rLock(context_); } locked_ = true; diff --git a/cpp_src/estl/contexted_locks.h b/cpp_src/estl/contexted_locks.h index ba8dc9045..2e60b0ec8 100644 --- a/cpp_src/estl/contexted_locks.h +++ b/cpp_src/estl/contexted_locks.h @@ -13,32 +13,27 @@ using std::adopt_lock_t; namespace reindexer { -const milliseconds kDefaultCondChkTime = milliseconds(20); +constexpr milliseconds kDefaultCondChkTime = milliseconds(20); template class contexted_unique_lock { public: using MutexType = _Mutex; - explicit contexted_unique_lock() : _M_mtx(nullptr), _M_owns(false), _M_context(nullptr), _M_chkTimeout(kDefaultCondChkTime) {} - explicit contexted_unique_lock(MutexType& __mtx, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(false), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); + explicit contexted_unique_lock() noexcept : _M_mtx(nullptr), _M_owns(false), _M_context(nullptr), _M_chkTimeout(kDefaultCondChkTime) {} + explicit contexted_unique_lock(MutexType& __mtx, Context& __context, milliseconds __chkTimeout = kDefaultCondChkTime) + : _M_mtx(&__mtx), _M_owns(false), _M_context(&__context), _M_chkTimeout(__chkTimeout) { lock(); } - explicit contexted_unique_lock(MutexType& __mtx, defer_lock_t, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(false), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); - } - explicit contexted_unique_lock(MutexType& __mtx, adopt_lock_t, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(true), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); - } - explicit contexted_unique_lock(MutexType& __mtx, try_to_lock_t, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(__mtx.try_lock()), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); - } - contexted_unique_lock(contexted_unique_lock&& lck) + explicit contexted_unique_lock(MutexType& __mtx, defer_lock_t, Context& __context, + milliseconds __chkTimeout = kDefaultCondChkTime) noexcept + : _M_mtx(&__mtx), _M_owns(false), _M_context(&__context), _M_chkTimeout(__chkTimeout) {} + explicit contexted_unique_lock(MutexType& __mtx, adopt_lock_t, Context& __context, + milliseconds __chkTimeout = kDefaultCondChkTime) noexcept + : _M_mtx(&__mtx), _M_owns(true), _M_context(&__context), _M_chkTimeout(__chkTimeout) {} + explicit contexted_unique_lock(MutexType& __mtx, try_to_lock_t, Context& __context, milliseconds __chkTimeout = kDefaultCondChkTime) + : _M_mtx(&__mtx), _M_owns(__mtx.try_lock()), _M_context(&__context), _M_chkTimeout(__chkTimeout) {} + contexted_unique_lock(contexted_unique_lock&& lck) noexcept : _M_mtx(lck._M_mtx), _M_owns(lck._M_owns), _M_context(lck._M_context), _M_chkTimeout(lck._M_chkTimeout) { lck._M_owns = false; lck._M_mtx = nullptr; @@ -50,7 +45,7 @@ class contexted_unique_lock { contexted_unique_lock(const contexted_unique_lock&) = delete; contexted_unique_lock& operator=(const contexted_unique_lock&) = delete; - contexted_unique_lock& operator=(contexted_unique_lock&& lck) { + contexted_unique_lock& operator=(contexted_unique_lock&& lck) noexcept { if (this != &lck) { if (_M_owns) unlock(); _M_mtx = lck._M_mtx; @@ -102,7 +97,7 @@ class contexted_unique_lock { MutexType* mutex() const noexcept { return _M_mtx; } private: - void _M_lockable() const { + void _M_lockable() const noexcept { if (_M_mtx == nullptr) assertrx(0); if (_M_owns) assertrx(0); } @@ -118,21 +113,17 @@ class contexted_shared_lock { public: using MutexType = _Mutex; - explicit contexted_shared_lock() : _M_mtx(nullptr), _M_owns(false), _M_context(nullptr), _M_chkTimeout(kDefaultCondChkTime) {} - explicit contexted_shared_lock(MutexType& __mtx, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(false), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); + explicit contexted_shared_lock() noexcept : _M_mtx(nullptr), _M_owns(false), _M_context(nullptr), _M_chkTimeout(kDefaultCondChkTime) {} + explicit contexted_shared_lock(MutexType& __mtx, Context& __context, milliseconds __chkTimeout = kDefaultCondChkTime) + : _M_mtx(&__mtx), _M_owns(false), _M_context(&__context), _M_chkTimeout(__chkTimeout) { lock(); } - explicit contexted_shared_lock(MutexType& __mtx, adopt_lock_t, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(true), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); - } - explicit contexted_shared_lock(MutexType& __mtx, try_to_lock_t, Context* __context, milliseconds __chkTimeout = kDefaultCondChkTime) - : _M_mtx(&__mtx), _M_owns(__mtx.try_lock()), _M_context(__context), _M_chkTimeout(__chkTimeout) { - assertrx(_M_context); - } - contexted_shared_lock(contexted_shared_lock&& lck) + explicit contexted_shared_lock(MutexType& __mtx, adopt_lock_t, Context& __context, + milliseconds __chkTimeout = kDefaultCondChkTime) noexcept + : _M_mtx(&__mtx), _M_owns(true), _M_context(&__context), _M_chkTimeout(__chkTimeout) {} + explicit contexted_shared_lock(MutexType& __mtx, try_to_lock_t, Context& __context, milliseconds __chkTimeout = kDefaultCondChkTime) + : _M_mtx(&__mtx), _M_owns(__mtx.try_lock()), _M_context(&__context), _M_chkTimeout(__chkTimeout) {} + contexted_shared_lock(contexted_shared_lock&& lck) noexcept : _M_mtx(lck._M_mtx), _M_owns(lck._M_owns), _M_context(lck._M_context), _M_chkTimeout(lck._M_chkTimeout) { lck._M_owns = false; lck._M_mtx = nullptr; @@ -144,7 +135,7 @@ class contexted_shared_lock { contexted_shared_lock(const contexted_shared_lock&) = delete; contexted_shared_lock& operator=(const contexted_shared_lock&) = delete; - contexted_shared_lock& operator=(contexted_shared_lock&& lck) { + contexted_shared_lock& operator=(contexted_shared_lock&& lck) noexcept { if (this != &lck) { if (_M_owns) unlock(); _M_mtx = lck._M_mtx; @@ -196,7 +187,7 @@ class contexted_shared_lock { MutexType* mutex() const noexcept { return _M_mtx; } private: - void _M_lockable() const { + void _M_lockable() const noexcept { if (_M_mtx == nullptr) assertrx(0); if (_M_owns) assertrx(0); } diff --git a/cpp_src/estl/h_vector.h b/cpp_src/estl/h_vector.h index 1f26945d3..bcba9a7b0 100644 --- a/cpp_src/estl/h_vector.h +++ b/cpp_src/estl/h_vector.h @@ -5,6 +5,7 @@ #include #include #include +#include #include "debug_macros.h" #include "trivial_reverse_iterator.h" diff --git a/cpp_src/gtests/tests/API/api.cc b/cpp_src/gtests/tests/API/api.cc index bdb97049f..cf14719c5 100644 --- a/cpp_src/gtests/tests/API/api.cc +++ b/cpp_src/gtests/tests/API/api.cc @@ -1,9 +1,19 @@ #include #include "gtest/gtest.h" +#include "tools/assertrx.h" +#include "tools/fsops.h" -int main(int argc, char* argv[]) { +int main(int argc, char *argv[]) { srand(time(NULL)); ::testing::InitGoogleTest(&argc, argv); + +#ifndef _WIN32 + const char *tmpDir = getenv("REINDEXER_TEST_DB_ROOT"); + if (tmpDir && *tmpDir) { + reindexer::fs::SetTempDir(std::string(tmpDir)); + } +#endif // _WIN32 + return RUN_ALL_TESTS(); } diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/index.cc b/cpp_src/gtests/tests/fixtures/fuzzing/index.cc index cb9f50d4e..17f7f9c59 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/index.cc +++ b/cpp_src/gtests/tests/fixtures/fuzzing/index.cc @@ -13,7 +13,7 @@ reindexer::IndexDef Index::IndexDef(RandomGenerator& rnd, const NsScheme& scheme IndexOpts opts; const bool pk = rnd.PkIndex(isPk_); opts.PK(pk); - opts.Array(rnd.RndArrayField(isArray_) == IsArray::Yes); + opts.Array(rnd.RndArrayField(isArray_) == IsArrayT::Yes); opts.Sparse(rnd.RndSparseIndex(isSparse_)); opts.Dense(rnd.DenseIndex()); opts.RTreeType(static_cast(rnd.RndInt(IndexOpts::Linear, IndexOpts::RStar))); @@ -58,7 +58,7 @@ void Index::Dump(std::ostream& os, const NsScheme& scheme, size_t offset) const for (size_t i = 0; i <= offset; ++i) os << " "; os << "array: " << std::boolalpha << IsArray() << '\n'; for (size_t i = 0; i <= offset; ++i) os << " "; - os << "sparse: " << std::boolalpha << (IsSparse() == IsSparse::Yes) << '\n'; + os << "sparse: " << std::boolalpha << (IsSparse() == IsSparseT::Yes) << '\n'; for (size_t i = 0; i <= offset; ++i) os << " "; std::visit(reindexer::overloaded{[&](const Child& child) { os << "composite: false\n"; diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/index.h b/cpp_src/gtests/tests/fixtures/fuzzing/index.h index 80407211c..4fe90a47b 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/index.h +++ b/cpp_src/gtests/tests/fixtures/fuzzing/index.h @@ -22,9 +22,9 @@ class Index { }; using Children = std::vector; - Index(std::string name, IndexType type, IsArray isArray, IsSparse isSparse, Children content) noexcept + Index(std::string name, IndexType type, IsArrayT isArray, IsSparseT isSparse, Children content) noexcept : name_{std::move(name)}, type_{type}, content_{std::move(content)}, isArray_{isArray}, isSparse_{isSparse} {} - Index(std::string name, IndexType type, IsArray isArray, IsSparse isSparse, Child content) noexcept + Index(std::string name, IndexType type, IsArrayT isArray, IsSparseT isSparse, Child content) noexcept : name_{std::move(name)}, type_{type}, content_{std::move(content)}, isArray_{isArray}, isSparse_{isSparse} {} const std::string& Name() const& noexcept { return name_; } @@ -34,7 +34,7 @@ class Index { const auto& Content() const&& = delete; bool IsPk() const noexcept { return isPk_; } void SetPk() noexcept { isPk_ = true; } - bool IsArray() const noexcept { return isArray_ == IsArray::Yes; } + bool IsArray() const noexcept { return isArray_ == IsArrayT::Yes; } auto IsSparse() const noexcept { return isSparse_; } reindexer::IndexDef IndexDef(RandomGenerator&, const NsScheme&, const std::vector&) const; @@ -46,8 +46,8 @@ class Index { IndexType type_; std::variant content_; bool isPk_{false}; - enum IsArray isArray_ { IsArray::No }; - enum IsSparse isSparse_ { IsSparse::No }; + IsArrayT isArray_{IsArrayT::No}; + IsSparseT isSparse_{IsSparseT::No}; }; } // namespace fuzzing diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/ns.cc b/cpp_src/gtests/tests/fixtures/fuzzing/ns.cc index 5a520d4a0..831653a84 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/ns.cc +++ b/cpp_src/gtests/tests/fixtures/fuzzing/ns.cc @@ -99,7 +99,7 @@ Ns::Ns(std::string name, RandomGenerator::ErrFactorType errorFactor) usedIndexNames.insert(name); } - indexes_.emplace_back(std::move(name), indexType, rndGen_.RndArrayField(array ? IsArray::Yes : IsArray::No), IsSparse::No, + indexes_.emplace_back(std::move(name), indexType, rndGen_.RndArrayField(array ? IsArrayT::Yes : IsArrayT::No), IsSparseT::No, std::move(children)); } else { FieldPath fldPath; @@ -113,8 +113,8 @@ Ns::Ns(std::string name, RandomGenerator::ErrFactorType errorFactor) if (!rndGen_.RndErr()) continue; const auto fldType = rndGen_.RndFieldType(); indexes_.emplace_back(rndGen_.IndexName(usedIndexNames), rndGen_.RndIndexType({fldType}), - rndGen_.RndBool(0.5) ? IsArray::Yes : IsArray::No, - rndGen_.RndBool(0.5) ? IsSparse::Yes : IsSparse::No, Index::Child{fldType, std::move(fldPath)}); + rndGen_.RndBool(0.5) ? IsArrayT::Yes : IsArrayT::No, + rndGen_.RndBool(0.5) ? IsSparseT::Yes : IsSparseT::No, Index::Child{fldType, std::move(fldPath)}); } else { const auto fldType = scheme_.GetFieldType(fldPath); const auto isArray = scheme_.IsArray(fldPath); @@ -132,7 +132,7 @@ Ns::Ns(std::string name, RandomGenerator::ErrFactorType errorFactor) rndGen_.RndSparseIndex(fldType), Index::Child{fldType, std::move(fldPath)}); } if (const auto& idx = indexes_.back(); - !idx.IsArray() && idx.IsSparse() == IsSparse::No && + !idx.IsArray() && idx.IsSparse() == IsSparseT::No && std::get(idx.Content()).type != FieldType::Point) { // TODO remove point check after #1352 scalarIndexes.push_back(indexes_.size() - 1); } @@ -145,7 +145,7 @@ Ns::Ns(std::string name, RandomGenerator::ErrFactorType errorFactor) std::vector ii; for (size_t i = 0, s = indexes_.size(); i < s; ++i) { const auto& idx = indexes_[i]; - if (!idx.IsArray() && idx.IsSparse() == IsSparse::No && availablePkIndexType(idx.Type()) && + if (!idx.IsArray() && idx.IsSparse() == IsSparseT::No && availablePkIndexType(idx.Type()) && (std::holds_alternative(idx.Content()) || availablePkFieldType(std::get(idx.Content()).type))) { ii.push_back(i); } @@ -163,7 +163,7 @@ Ns::Ns(std::string name, RandomGenerator::ErrFactorType errorFactor) usedIndexNames.insert(name); } } - indexes_.emplace_back(std::move(name), rndGen_.RndPkIndexType({fldType}), IsArray::No, IsSparse::No, + indexes_.emplace_back(std::move(name), rndGen_.RndPkIndexType({fldType}), IsArrayT::No, IsSparseT::No, Index::Child{fldType, std::move(path)}); indexes_.back().SetPk(); } else { diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.cc b/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.cc index 8c027dbc6..0a1c92829 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.cc +++ b/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.cc @@ -77,13 +77,13 @@ size_t NsScheme::FieldsCount(const FieldPath& path) const noexcept { ref[path.back()].content); } -IsArray NsScheme::IsArray(const FieldPath& path) const noexcept { +IsArrayT NsScheme::IsArray(const FieldPath& path) const noexcept { if (path.empty()) return ns_.array; const Node::Children* ptr = &std::get(ns_.content); for (size_t i = 0, s = path.size() - 1; i < s; ++i) { assertrx(ptr->size() > path[i]); const auto& idx = (*ptr)[path[i]]; - if (idx.array == IsArray::Yes) return IsArray::Yes; + if (idx.array == IsArrayT::Yes) return IsArrayT::Yes; std::visit( reindexer::overloaded{[&ptr](const Node::Children& c) noexcept { ptr = &c; }, [](const Node::Child&) noexcept { assertrx(0); }}, idx.content); @@ -127,16 +127,16 @@ std::string NsScheme::GetJsonPath(const FieldPath& path) const noexcept { return res; } -void NsScheme::AddIndex(const FieldPath& path, size_t index, IsSparse isSparse) { +void NsScheme::AddIndex(const FieldPath& path, size_t index, IsSparseT isSparse) { assertrx(!path.empty()); - if (isSparse == IsSparse::No) { - ns_.sparse = IsSparse::No; + if (isSparse == IsSparseT::No) { + ns_.sparse = IsSparseT::No; } Node::Children* ptr = &std::get(ns_.content); for (size_t i = 0, s = path.size() - 1; i < s; ++i) { assertrx(ptr->size() > path[i]); - if (isSparse == IsSparse::No) { - (*ptr)[path[i]].sparse = IsSparse::No; + if (isSparse == IsSparseT::No) { + (*ptr)[path[i]].sparse = IsSparseT::No; } std::visit(reindexer::overloaded{[&ptr](Node::Children& c) noexcept { ptr = &c; }, [](Node::Child&) noexcept { assertrx(0); }}, (*ptr)[path[i]].content); @@ -148,14 +148,14 @@ void NsScheme::AddIndex(const FieldPath& path, size_t index, IsSparse isSparse) FieldPath NsScheme::AddRndPkField(RandomGenerator& rnd) { auto& children = std::get(ns_.content); children.emplace_back(Node{rnd.FieldName(generatedNames_), Node::Child{rnd.RndPkIndexFieldType()}}); - children.back().array = IsArray::No; - children.back().sparse = IsSparse::No; + children.back().array = IsArrayT::No; + children.back().sparse = IsSparseT::No; return {children.size() - 1}; } -void NsScheme::addIndex(Node& node, size_t index, IsSparse isSparse) { - if (isSparse == IsSparse::No) { - node.sparse = IsSparse::No; +void NsScheme::addIndex(Node& node, size_t index, IsSparseT isSparse) { + if (isSparse == IsSparseT::No) { + node.sparse = IsSparseT::No; } std::visit(reindexer::overloaded{[index](Node::Child& c) noexcept { c.indexes.push_back(index); }, [](Node::Children&) noexcept { assertrx(0); }}, @@ -175,14 +175,14 @@ void NsScheme::fillChildren(Node::Children& children, RandomGenerator& rnd, unsi children.back().array = rnd.RndArrayField(); } if (!canBeSparse && !rnd.RndErr()) { - children.back().sparse = IsSparse::No; + children.back().sparse = IsSparseT::No; } } else { children.emplace_back(Node{std::move(fName), Node::Child{type}}); if (type == FieldType::Point) { canBeSparse = false; canBeArray = false; - children.back().sparse = IsSparse::No; + children.back().sparse = IsSparseT::No; } if (canBeArray || rnd.RndErr()) { children.back().array = rnd.RndArrayField(); @@ -256,7 +256,7 @@ void NsScheme::toJson(reindexer::JsonBuilder& builder, const Node::Children& chi const std::vector& indexes) { for (const Node& n : children) { if (!rnd.NeedThisNode(n.sparse)) continue; - if (rnd.RndArrayField(n.array) == IsArray::Yes) { + if (rnd.RndArrayField(n.array) == IsArrayT::Yes) { auto arr = builder.Array(n.name); const size_t arrSize = rnd.ArraySize(); for (size_t i = 0; i < arrSize; ++i) { @@ -294,9 +294,9 @@ void NsScheme::Node::Dump(std::ostream& os, size_t offset) const { for (size_t i = 0; i <= offset; ++i) os << " "; os << "name: " << name << '\n'; for (size_t i = 0; i <= offset; ++i) os << " "; - os << "sparse: " << std::boolalpha << (sparse == IsSparse::Yes) << '\n'; + os << "sparse: " << std::boolalpha << (sparse == IsSparseT::Yes) << '\n'; for (size_t i = 0; i <= offset; ++i) os << " "; - os << "array: " << std::boolalpha << (array == IsArray::Yes) << '\n'; + os << "array: " << std::boolalpha << (array == IsArrayT::Yes) << '\n'; std::visit(reindexer::overloaded{[&](const Child& child) { for (size_t i = 0; i <= offset; ++i) os << " "; os << "type: " << child.type << '\n'; diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.h b/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.h index a63a76e38..8123d726f 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.h +++ b/cpp_src/gtests/tests/fixtures/fuzzing/ns_scheme.h @@ -29,8 +29,8 @@ class NsScheme { std::string name; std::variant content; - IsSparse sparse{IsSparse::Yes}; - IsArray array{IsArray::No}; + IsSparseT sparse{IsSparseT::Yes}; + IsArrayT array{IsArrayT::No}; void Dump(std::ostream&, size_t offset) const; }; @@ -43,17 +43,17 @@ class NsScheme { bool IsStruct(const FieldPath&) const noexcept; bool IsPoint(const FieldPath&) const noexcept; bool IsTtl(const FieldPath&, const std::vector&) const noexcept; - enum IsArray IsArray(const FieldPath&) const noexcept; + IsArrayT IsArray(const FieldPath&) const noexcept; FieldType GetFieldType(const FieldPath&) const noexcept; void SetFieldType(const FieldPath&, FieldType) noexcept; std::string GetJsonPath(const FieldPath&) const noexcept; - void AddIndex(const FieldPath&, size_t index, IsSparse); + void AddIndex(const FieldPath&, size_t index, IsSparseT); void NewItem(reindexer::WrSerializer&, RandomGenerator&, const std::vector&); void Dump(std::ostream& os, size_t offset) const { ns_.Dump(os, offset); } FieldPath AddRndPkField(RandomGenerator&); private: - static void addIndex(Node&, size_t index, IsSparse); + static void addIndex(Node&, size_t index, IsSparseT); void fillChildren(Node::Children&, RandomGenerator&, unsigned level, bool& canBeArray, bool& canBeSparse); const Node::Children& findLastContainer(const FieldPath&) const noexcept; Node::Children& findLastContainer(const FieldPath&) noexcept; diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.cc b/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.cc index e207a6667..82d85a68e 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.cc +++ b/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.cc @@ -228,7 +228,7 @@ FieldPath RandomGenerator::RndScalarField(const NsScheme& nsScheme) { const int end = idx + size; while (idx < end) { res.back() = idx % size; - if (nsScheme.IsArray(res) == IsArray::No && !nsScheme.IsPoint(res)) break; + if (nsScheme.IsArray(res) == IsArrayT::No && !nsScheme.IsPoint(res)) break; ++idx; } if (idx == end) return {}; diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.h b/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.h index 4960f28c3..bebb70490 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.h +++ b/cpp_src/gtests/tests/fixtures/fuzzing/random_generator.h @@ -60,20 +60,20 @@ class RandomGenerator { IndexType RndIndexType(const std::vector&); IndexType RndPkIndexType(const std::vector&); IndexType RndIndexType(IndexType); - IsArray RndArrayField() { return RndBool(0.2) ? IsArray::Yes : IsArray::No; } - IsArray RndArrayField(IsArray array) { + IsArrayT RndArrayField() { return RndBool(0.2) ? IsArrayT::Yes : IsArrayT::No; } + IsArrayT RndArrayField(IsArrayT array) { if (RndErr()) { - return array == IsArray::Yes ? IsArray::No : IsArray::Yes; + return array == IsArrayT::Yes ? IsArrayT::No : IsArrayT::Yes; } return array; } size_t ArraySize(); bool PkIndex(bool pk) { return RndErr() ? RndBool(0.5) : pk; } - IsSparse RndSparseIndex(FieldType fldType) { + IsSparseT RndSparseIndex(FieldType fldType) { const bool couldBeSparse = fldType != FieldType::Struct && fldType != FieldType::Uuid; // TODO remove uuid #1470 - return (couldBeSparse ? RndBool(0.2) : RndErr()) ? IsSparse::Yes : IsSparse::No; + return (couldBeSparse ? RndBool(0.2) : RndErr()) ? IsSparseT::Yes : IsSparseT::No; } - bool RndSparseIndex(IsSparse isSparse) { return (isSparse == IsSparse::Yes) != RndErr(); } + bool RndSparseIndex(IsSparseT isSparse) { return (isSparse == IsSparseT::Yes) != RndErr(); } bool DenseIndex() { return RndBool(0.2); } int64_t ExpiredIndex() { return RndInt(0, 100'000); } // TODO size_t IndexesCount(); @@ -137,7 +137,7 @@ class RandomGenerator { return err; } char RndChar() { return rndChar_(gen_); } - bool NeedThisNode(IsSparse sparse) { return sparse == IsSparse::Yes ? RndBool(0.5) : !RndErr(); } + bool NeedThisNode(IsSparseT sparse) { return sparse == IsSparseT::Yes ? RndBool(0.5) : !RndErr(); } int RndIntValue() { enum Size : uint8_t { Short, Long, END = Long }; switch (RndWhich()) { diff --git a/cpp_src/gtests/tests/fixtures/fuzzing/types.h b/cpp_src/gtests/tests/fixtures/fuzzing/types.h index db97087c6..98ec500a8 100644 --- a/cpp_src/gtests/tests/fixtures/fuzzing/types.h +++ b/cpp_src/gtests/tests/fixtures/fuzzing/types.h @@ -23,7 +23,7 @@ enum class IndexType { Store, Hash, Tree, Ttl, FastFT, FuzzyFT, RTree, END = RTr std::string_view ToText(IndexType); std::ostream& operator<<(std::ostream&, IndexType); -enum class IsArray : bool { Yes = true, No = false }; -enum class IsSparse : bool { Yes = true, No = false }; +enum class IsArrayT : bool { Yes = true, No = false }; +enum class IsSparseT : bool { Yes = true, No = false }; } // namespace fuzzing diff --git a/cpp_src/readme.md b/cpp_src/readme.md index 05c6e0cfb..b496cca9e 100644 --- a/cpp_src/readme.md +++ b/cpp_src/readme.md @@ -46,7 +46,7 @@ yum update yum install reindexer-server ``` -Available distros: `centos-7`, `fedora-36`, `fedora-37`, `redos-7` +Available distros: `centos-7`, `fedora-38`, `fedora-39`, `redos-7` ### Ubuntu/Debian diff --git a/cpp_src/server/contrib/server.yml b/cpp_src/server/contrib/server.yml index 2df0c33cd..bdc4fe6bc 100644 --- a/cpp_src/server/contrib/server.yml +++ b/cpp_src/server/contrib/server.yml @@ -2738,8 +2738,8 @@ definitions: type: integer default: 20000 minimum: 0 - maximum: 65535 - description: "Maximum documents count which will be processed in merge query results. Increasing this value may refine ranking of queries with high frequency words, but will decrease search speed" + maximum: 65000 + description: "Maximum documents count which will be processed in merge query results. Increasing this value may refine ranking of queries with high frequency words, but will decrease search speed" extra_word_symbols: type: string default: "-/+" @@ -3984,7 +3984,14 @@ definitions: description: "Enable network traffic compression" cluster_id: type: integer + default: 2 description: "Cluser ID - must be same for client and for master" + server_id: + type: integer + default: 0 + minimun: 0 + maximum: 999 + description: "Node identifier. Should be unique for each node in the replicated cluster (non-unique IDs are also allowed, but may lead to the inconsistency in some cases" force_sync_on_logic_error: type: boolean description: "force resync on logic error conditions" diff --git a/cpp_src/server/httpserver.cc b/cpp_src/server/httpserver.cc index 65bd6dc2f..27e2adc13 100644 --- a/cpp_src/server/httpserver.cc +++ b/cpp_src/server/httpserver.cc @@ -226,11 +226,9 @@ int HTTPServer::GetDatabases(http::Context &ctx) { } if (sortDirection) { - std::sort(dbs.begin(), dbs.end(), [sortDirection](const std::string &lhs, const std::string &rhs) { - if (sortDirection > 0) - return collateCompare(lhs, rhs, SortingPrioritiesTable()) < 0; - else - return collateCompare(lhs, rhs, SortingPrioritiesTable()) > 0; + boost::sort::pdqsort(dbs.begin(), dbs.end(), [sortDirection](const std::string &lhs, const std::string &rhs) { + return (sortDirection > 0) ? (collateCompare(lhs, rhs, SortingPrioritiesTable()) < 0) + : (collateCompare(lhs, rhs, SortingPrioritiesTable()) > 0); }); } @@ -320,11 +318,9 @@ int HTTPServer::GetNamespaces(http::Context &ctx) { } if (sortDirection) { - std::sort(nsDefs.begin(), nsDefs.end(), [sortDirection](const NamespaceDef &lhs, const NamespaceDef &rhs) { - if (sortDirection > 0) - return collateCompare(lhs.name, rhs.name, SortingPrioritiesTable()) < 0; - else - return collateCompare(lhs.name, rhs.name, SortingPrioritiesTable()) > 0; + boost::sort::pdqsort(nsDefs.begin(), nsDefs.end(), [sortDirection](const NamespaceDef &lhs, const NamespaceDef &rhs) { + return (sortDirection > 0) ? (collateCompare(lhs.name, rhs.name, SortingPrioritiesTable()) < 0) + : (collateCompare(lhs.name, rhs.name, SortingPrioritiesTable()) > 0); }); } @@ -543,9 +539,9 @@ int HTTPServer::GetMetaList(http::Context &ctx) { return jsonStatus(ctx, http::HttpStatus(err)); } if (sortDirection == Asc) { - std::sort(keys.begin(), keys.end()); + boost::sort::pdqsort(keys.begin(), keys.end()); } else if (sortDirection == Desc) { - std::sort(keys.begin(), keys.end(), std::greater()); + boost::sort::pdqsort(keys.begin(), keys.end(), std::greater()); } auto keysIt = keys.begin(); auto keysEnd = keys.end(); diff --git a/cpp_src/tools/fsops.cc b/cpp_src/tools/fsops.cc index e7d8db748..5fbfcae71 100644 --- a/cpp_src/tools/fsops.cc +++ b/cpp_src/tools/fsops.cc @@ -5,6 +5,7 @@ #include #include #include +#include #include "errors.h" #include "tools/oscompat.h" @@ -177,7 +178,16 @@ std::string GetCwd() { return std::string(getcwd(buff, FILENAME_MAX)); } +static std::string tmpDir; +static std::mutex tmpDirMtx; + std::string GetTempDir() { + { + std::lock_guard lck(tmpDirMtx); + if (!tmpDir.empty()) { + return tmpDir; + } + } #ifdef _WIN32 char tmpBuf[512]; *tmpBuf = 0; @@ -190,6 +200,11 @@ std::string GetTempDir() { #endif } +void SetTempDir(std::string &&dir) noexcept { + std::lock_guard lck(tmpDirMtx); + tmpDir = std::move(dir); +} + std::string GetHomeDir() { const char *homeDir = getenv("HOME"); if (homeDir && *homeDir) return homeDir; @@ -355,5 +370,6 @@ std::string GetRelativePath(const std::string &path, unsigned maxUp) { rpath.append(path.begin() + same, path.end()); return rpath; } + } // namespace fs } // namespace reindexer diff --git a/cpp_src/tools/fsops.h b/cpp_src/tools/fsops.h index 46d56db4c..015ef0a66 100644 --- a/cpp_src/tools/fsops.h +++ b/cpp_src/tools/fsops.h @@ -37,6 +37,7 @@ TimeStats StatTime(const std::string &path); std::string GetCwd(); std::string GetDirPath(const std::string &path); std::string GetTempDir(); +void SetTempDir(std::string &&dir) noexcept; std::string GetHomeDir(); std::string GetRelativePath(const std::string &path, unsigned maxUp = 1024); inline int Rename(const std::string &from, const std::string &to) { return rename(from.c_str(), to.c_str()); } diff --git a/cpp_src/tools/jsonstring.h b/cpp_src/tools/jsonstring.h index 34c6eeb56..36601af0a 100644 --- a/cpp_src/tools/jsonstring.h +++ b/cpp_src/tools/jsonstring.h @@ -71,12 +71,15 @@ inline void encode(uint8_t *p, uint64_t l, std::vector> p[-3] = (uptr >> 8) & 0xFF; p[-4] = (uptr >> 16) & 0xFF; p[-5] = (uptr >> 24) & 0xFF; - if constexpr (sizeof(uintptr_t) == 8) { - p[-6] = (uptr >> 32) & 0xFF; - p[-7] = (uptr >> 40) & 0xFF; - p[-8] = (uptr >> 48) & 0xFF; - p[-9] = (uptr >> 56) & 0xFF; - } +#if UINTPTR_MAX == 0xFFFFFFFF +#elif UINTPTR_MAX == 0xFFFFFFFFFFFFFFFF + p[-6] = (uptr >> 32) & 0xFF; + p[-7] = (uptr >> 40) & 0xFF; + p[-8] = (uptr >> 48) & 0xFF; + p[-9] = (uptr >> 56) & 0xFF; +#else + static_assert(false, "Unexpected uintptr_t size"); +#endif } else { // Put length p[0] = l & 0xFF; diff --git a/cpp_src/vendor/gason/gason.h b/cpp_src/vendor/gason/gason.h index 6e227f7a8..76c218d37 100644 --- a/cpp_src/vendor/gason/gason.h +++ b/cpp_src/vendor/gason/gason.h @@ -6,6 +6,7 @@ #include #include #include +#include #include #include "estl/span.h" #include "tools/jsonstring.h" diff --git a/describer.go b/describer.go index ed494bed8..b356b3cba 100644 --- a/describer.go +++ b/describer.go @@ -85,7 +85,7 @@ type CacheMemStat struct { type LsnT struct { // Operation counter Counter int64 `json:"counter"` - // Node identifyer + // Node identifier ServerId int `json:"server_id"` } diff --git a/fulltext.md b/fulltext.md index e741225a2..672ab7e52 100644 --- a/fulltext.md +++ b/fulltext.md @@ -378,10 +378,10 @@ FtTyposDetailedConfig: config for more precise typos algorithm tuning. | | Parameter name | Type | Description | Default value | |---|:----------------------------:|:--------:|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|:-------------:| -| | MaxTypoDistance | int | Maximum distance between symbols in initial and target words to perform substitution. Check [typos handling](#typos-handling-details) section for detailed description. | 0 | -| | MaxSymbolPermutationDistance | int | aximum distance between same symbols in initial and target words to perform substitution (to handle cases, when two symbolws were switched with each other). Check [typos handling](#typos-handling-details) section for detailed description. | 1 | -| | MaxMissingLetters | int | Maximum number of symbols, which may be removed from the initial term to transform it into the result word. Check [typos handling](#typos-handling-details) section for detailed description. | 2 | -| | MaxExtraLetters | int | Maximum number of symbols, which may be added to the initial term to transform it into the result word. Check [typos handling](#typos-handling-details) section for detailed description. | 2 | +| | MaxTypoDistance | int | Maximum distance between symbols in initial and target words to perform substitution. Check [typos handling](#typos-handling-details) section for detailed description. | 0 | +| | MaxSymbolPermutationDistance | int | aximum distance between same symbols in initial and target words to perform substitution (to handle cases, when two symbolws were switched with each other). Check [typos handling](#typos-handling-details) section for detailed description. | 1 | +| | MaxMissingLetters | int | Maximum number of symbols, which may be removed from the initial term to transform it into the result word. Check [typos handling](#typos-handling-details) section for detailed description. | 2 | +| | MaxExtraLetters | int | Maximum number of symbols, which may be added to the initial term to transform it into the result word. Check [typos handling](#typos-handling-details) section for detailed description. | 2 | ### Base ranking config diff --git a/test/fields_autogen_test.go b/test/fields_autogen_test.go index 0813cb0af..2f25b6176 100644 --- a/test/fields_autogen_test.go +++ b/test/fields_autogen_test.go @@ -26,6 +26,9 @@ func init() { } func TestAutogen(t *testing.T) { + + currentSerial := 0 + t.Run("field should be updated with current timestamp using NOW() function", func(t *testing.T) { precepts := []string{"updated_time=NOW()"} item := TestItemAutogen{} @@ -51,9 +54,10 @@ func TestAutogen(t *testing.T) { item := TestItemAutogen{} err := DB.Upsert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 - assert.Equal(t, 1, item.Age) - assert.Equal(t, int64(1), item.Genre) + assert.Equal(t, currentSerial, item.Age) + assert.Equal(t, int64(currentSerial), item.Genre) t.Run("serial field should be increased by 5 after 5 iterations (must be equal 6 after previous test)", func(t *testing.T) { precepts := []string{"genre=SERIAL()", "age=serial()"} @@ -61,70 +65,84 @@ func TestAutogen(t *testing.T) { for i := 0; i < 5; i++ { err := DB.Upsert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 } - assert.Equal(t, 6, item.Age) - assert.Equal(t, int64(6), item.Genre) + assert.Equal(t, currentSerial, item.Age) + assert.Equal(t, int64(currentSerial), item.Genre) }) }) t.Run("fill on insert, update, upsert", func(t *testing.T) { - precepts := []string{"updated_time=NOW()"} + precepts := []string{"updated_time=NOW()", "age=SERIAL()"} item := TestItemAutogen{ID: rand.Intn(100000000)} _, err := DB.Insert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 assert.GreaterOrEqual(t, item.UpdatedTime, time.Now().Unix()-1) assert.LessOrEqual(t, item.UpdatedTime, time.Now().Unix()) + assert.Equal(t, currentSerial, item.Age) item = TestItemAutogen{} err = DB.Upsert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 assert.GreaterOrEqual(t, item.UpdatedTime, time.Now().Unix()-1) assert.LessOrEqual(t, item.UpdatedTime, time.Now().Unix()) + assert.Equal(t, currentSerial, item.Age) item = TestItemAutogen{} _, err = DB.Update(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 assert.GreaterOrEqual(t, item.UpdatedTime, time.Now().Unix()-1) assert.LessOrEqual(t, item.UpdatedTime, time.Now().Unix()) + assert.Equal(t, currentSerial, item.Age) }) - t.Run("fill on upsert not exist item", func(t *testing.T) { - precepts := []string{"updated_time=NOW()"} + t.Run("fill on upsert nonexist item", func(t *testing.T) { + precepts := []string{"updated_time=NOW()", "age=SERIAL()"} item := TestItemAutogen{ID: rand.Intn(100000000)} err := DB.Upsert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 assert.GreaterOrEqual(t, item.UpdatedTime, time.Now().Unix()-1) assert.LessOrEqual(t, item.UpdatedTime, time.Now().Unix()) + assert.Equal(t, currentSerial, item.Age) }) - t.Run("not fill on update not exist item", func(t *testing.T) { - precepts := []string{"updated_time=NOW()"} + t.Run("doesn't fill on update nonexist item", func(t *testing.T) { + precepts := []string{"updated_time=NOW()", "age=SERIAL()"} item := TestItemAutogen{ID: rand.Intn(100000000)} count, err := DB.Update(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 // remove after 1602 assert.Equal(t, 0, count) assert.Equal(t, int64(0), item.UpdatedTime) + assert.Equal(t, 0, item.Age) }) - t.Run("not fill on insert exist item", func(t *testing.T) { - precepts := []string{"updated_time=NOW()"} + t.Run("doesn't fill on insert exist item", func(t *testing.T) { + precepts := []string{"updated_time=NOW()", "age=SERIAL()"} id := rand.Intn(100000000) item := TestItemAutogen{ID: id} count, err := DB.Insert(ns, &item, precepts...) require.NoError(t, err) + currentSerial += 1 assert.Equal(t, 1, count) assert.GreaterOrEqual(t, item.UpdatedTime, time.Now().Unix()-1) assert.LessOrEqual(t, item.UpdatedTime, time.Now().Unix()) + assert.Equal(t, currentSerial, item.Age) item = TestItemAutogen{ID: id} count, err = DB.Insert(ns, &item, precepts...) require.NoError(t, err) assert.Equal(t, 0, count) assert.Equal(t, int64(0), item.UpdatedTime) + assert.Equal(t, 0, item.Age) }) }