Loading core/src/scheduler/SchedInst.h +4 −0 Original line number Diff line number Diff line Loading @@ -25,6 +25,7 @@ #include "optimizer/BuildIndexPass.h" #include "optimizer/FaissFlatPass.h" #include "optimizer/FaissIVFFlatPass.h" #include "optimizer/FaissIVFPQPass.h" #include "optimizer/FaissIVFSQ8HPass.h" #include "optimizer/FaissIVFSQ8Pass.h" #include "optimizer/FallbackPass.h" Loading Loading @@ -129,7 +130,10 @@ class OptimizerInst { pass_list.push_back(std::make_shared<FaissFlatPass>()); pass_list.push_back(std::make_shared<FaissIVFFlatPass>()); pass_list.push_back(std::make_shared<FaissIVFSQ8Pass>()); #ifdef CUSTOMIZATION pass_list.push_back(std::make_shared<FaissIVFSQ8HPass>()); #endif pass_list.push_back(std::make_shared<FaissIVFPQPass>()); } #endif pass_list.push_back(std::make_shared<FallbackPass>()); Loading core/src/scheduler/optimizer/FaissIVFPQPass.cpp 0 → 100644 +74 −0 Original line number Diff line number Diff line // Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. 
#ifdef MILVUS_GPU_VERSION
#include "scheduler/optimizer/FaissIVFPQPass.h"

#include <stdexcept>

#include "cache/GpuCacheMgr.h"
#include "scheduler/SchedInst.h"
#include "scheduler/Utils.h"
#include "scheduler/task/SearchTask.h"
#include "scheduler/tasklabel/SpecResLabel.h"
#include "server/Config.h"
#include "utils/Log.h"

namespace milvus {
namespace scheduler {

// Reads the GPU search threshold and the list of search GPUs from the server config.
//
// A threshold that cannot be read is not fatal: threshold_ is set to the largest
// int64_t value, so the `nq < threshold_` test in Run() keeps choosing the cpu.
//
// Throws std::runtime_error when the GPU search resource list cannot be read.
void
FaissIVFPQPass::Init() {
    // This whole file is already wrapped in MILVUS_GPU_VERSION, so no inner guard is needed.
    server::Config& config = server::Config::GetInstance();

    Status s = config.GetEngineConfigGpuSearchThreshold(threshold_);
    if (!s.ok()) {
        // threshold_ is declared as int64_t, so use the matching limit (was int32_t).
        threshold_ = std::numeric_limits<int64_t>::max();
    }

    s = config.GetGpuResourceConfigSearchResources(gpus);
    if (!s.ok()) {
        // A bare `throw;` with no exception in flight calls std::terminate();
        // throw a real exception so the failure can be reported and caught.
        throw std::runtime_error("FaissIVFPQPass: failed to load gpu search resources from config");
    }
}

// Picks the resource a FAISS_PQ search task should run on and attaches it as a SpecResLabel.
//
// Returns false (task left untouched) when the task is not a search task, when its
// file is not a FAISS_PQ index, or when the owning search job can no longer be obtained.
// Returns true after the label has been set.
bool
FaissIVFPQPass::Run(const TaskPtr& task) {
    if (task->Type() != TaskType::SearchTask) {
        return false;
    }

    auto search_task = std::static_pointer_cast<XSearchTask>(task);
    if (search_task->file_->engine_type_ != static_cast<int>(engine::EngineType::FAISS_PQ)) {
        return false;
    }

    auto search_job = std::static_pointer_cast<SearchJob>(search_task->job_.lock());
    if (search_job == nullptr) {
        // lock() returned null, so there is no job to read nq from.
        // NOTE(review): confirm that later passes cope with the task staying unlabeled here.
        SERVER_LOG_DEBUG << "FaissIVFPQPass: search job is no longer available, skip this pass!";
        return false;
    }

    ResourcePtr res_ptr;
    if (search_job->nq() < threshold_) {
        SERVER_LOG_DEBUG << "FaissIVFPQPass: nq < gpu_search_threshold, specify cpu to search!";
        res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
    } else if (gpus.empty()) {
        // Guard the modulo below: `count_ % 0` is undefined behaviour.
        SERVER_LOG_DEBUG << "FaissIVFPQPass: no gpu search resources configured, specify cpu to search!";
        res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
    } else {
        // Rotate through the configured GPUs, one step per GPU-routed task.
        const auto best_device_id = count_ % gpus.size();
        SERVER_LOG_DEBUG << "FaissIVFPQPass: nq >= gpu_search_threshold, specify gpu" << best_device_id
                         << " to search!";
        count_++;
        res_ptr = ResMgrInst::GetInstance()->GetResource(ResourceType::GPU, gpus[best_device_id]);
    }

    auto label = std::make_shared<SpecResLabel>(res_ptr);
    task->label() = label;
    return true;
}

}  // namespace scheduler
}  // namespace milvus
#endif
// core/src/scheduler/optimizer/FaissIVFPQPass.h 0 → 100644 +58 −0 Original line number Diff line number Diff line
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.
// The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.

#ifdef MILVUS_GPU_VERSION
#pragma once

#include <condition_variable>
#include <cstdint>
#include <deque>
#include <limits>
#include <list>
#include <memory>
#include <mutex>
#include <queue>
#include <string>
#include <thread>
#include <unordered_map>
#include <vector>

#include "Pass.h"

namespace milvus {
namespace scheduler {

// Scheduler optimizer pass for search tasks whose index file is of engine type FAISS_PQ.
// Only compiled when MILVUS_GPU_VERSION is defined.
class FaissIVFPQPass : public Pass {
 public:
    FaissIVFPQPass() = default;

    // Loads threshold_ and gpus from the server configuration.
    void
    Init() override;

    // Attaches a resource label (cpu or one of the configured GPUs) to a matching
    // search task. Returns false when the task is not handled by this pass.
    bool
    Run(const TaskPtr& task) override;

 private:
    // Search jobs whose nq is below this value are routed to the cpu.
    int64_t threshold_ = std::numeric_limits<int64_t>::max();
    // Incremented once per GPU-routed task; taken modulo gpus.size() to pick the device.
    int64_t count_ = 0;
    // GPU ids usable for search, as read from the configuration.
    std::vector<int64_t> gpus;
};

using FaissIVFPQPassPtr = std::shared_ptr<FaissIVFPQPass>;

}  // namespace scheduler
}  // namespace milvus
#endif
core/src/scheduler/SchedInst.h +4 −0 Original line number Diff line number Diff line Loading @@ -25,6 +25,7 @@ #include "optimizer/BuildIndexPass.h" #include "optimizer/FaissFlatPass.h" #include "optimizer/FaissIVFFlatPass.h" #include "optimizer/FaissIVFPQPass.h" #include "optimizer/FaissIVFSQ8HPass.h" #include "optimizer/FaissIVFSQ8Pass.h" #include "optimizer/FallbackPass.h" Loading Loading @@ -129,7 +130,10 @@ class OptimizerInst { pass_list.push_back(std::make_shared<FaissFlatPass>()); pass_list.push_back(std::make_shared<FaissIVFFlatPass>()); pass_list.push_back(std::make_shared<FaissIVFSQ8Pass>()); #ifdef CUSTOMIZATION pass_list.push_back(std::make_shared<FaissIVFSQ8HPass>()); #endif pass_list.push_back(std::make_shared<FaissIVFPQPass>()); } #endif pass_list.push_back(std::make_shared<FallbackPass>()); Loading
// core/src/scheduler/optimizer/FaissIVFPQPass.cpp 0 → 100644 +74 −0 Original line number Diff line number Diff line
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.

#ifdef MILVUS_GPU_VERSION
#include "scheduler/optimizer/FaissIVFPQPass.h"

#include <stdexcept>

#include "cache/GpuCacheMgr.h"
#include "scheduler/SchedInst.h"
#include "scheduler/Utils.h"
#include "scheduler/task/SearchTask.h"
#include "scheduler/tasklabel/SpecResLabel.h"
#include "server/Config.h"
#include "utils/Log.h"

namespace milvus {
namespace scheduler {

// Initializes the pass from the server configuration: the nq threshold above which
// searches go to a GPU, and the ids of the GPUs that may be used for search.
//
// If the threshold cannot be read, threshold_ falls back to the maximum int64_t,
// which makes the `nq < threshold_` comparison in Run() select the cpu.
//
// Throws std::runtime_error if the GPU search resources cannot be read.
void
FaissIVFPQPass::Init() {
    // No inner MILVUS_GPU_VERSION guard: the enclosing #ifdef already covers this file.
    server::Config& config = server::Config::GetInstance();

    Status s = config.GetEngineConfigGpuSearchThreshold(threshold_);
    if (!s.ok()) {
        // Use the limit of threshold_'s own type (int64_t) rather than int32_t.
        threshold_ = std::numeric_limits<int64_t>::max();
    }

    s = config.GetGpuResourceConfigSearchResources(gpus);
    if (!s.ok()) {
        // `throw;` outside a handler has nothing to rethrow and ends in std::terminate();
        // raise a concrete exception instead.
        throw std::runtime_error("FaissIVFPQPass: failed to load gpu search resources from config");
    }
}

// Labels a FAISS_PQ search task with the resource that should execute it.
//
// Returns false without touching the task when it is not a search task, when its
// file is not a FAISS_PQ index, or when the search job behind it cannot be obtained.
// Otherwise sets task->label() to a SpecResLabel and returns true.
bool
FaissIVFPQPass::Run(const TaskPtr& task) {
    if (task->Type() != TaskType::SearchTask) {
        return false;
    }

    auto search_task = std::static_pointer_cast<XSearchTask>(task);
    if (search_task->file_->engine_type_ != static_cast<int>(engine::EngineType::FAISS_PQ)) {
        return false;
    }

    auto search_job = std::static_pointer_cast<SearchJob>(search_task->job_.lock());
    if (search_job == nullptr) {
        // Without a job there is no nq to compare; dereferencing null would crash.
        // NOTE(review): verify that a following pass labels the task in this case.
        SERVER_LOG_DEBUG << "FaissIVFPQPass: search job is no longer available, skip this pass!";
        return false;
    }

    ResourcePtr res_ptr;
    if (search_job->nq() < threshold_) {
        SERVER_LOG_DEBUG << "FaissIVFPQPass: nq < gpu_search_threshold, specify cpu to search!";
        res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
    } else if (gpus.empty()) {
        // An empty GPU list would make the modulo below divide by zero.
        SERVER_LOG_DEBUG << "FaissIVFPQPass: no gpu search resources configured, specify cpu to search!";
        res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
    } else {
        // count_ advances once per GPU-routed task, so devices are used in rotation.
        const auto best_device_id = count_ % gpus.size();
        SERVER_LOG_DEBUG << "FaissIVFPQPass: nq >= gpu_search_threshold, specify gpu" << best_device_id
                         << " to search!";
        count_++;
        res_ptr = ResMgrInst::GetInstance()->GetResource(ResourceType::GPU, gpus[best_device_id]);
    }

    auto label = std::make_shared<SpecResLabel>(res_ptr);
    task->label() = label;
    return true;
}

}  // namespace scheduler
}  // namespace milvus
#endif
// core/src/scheduler/optimizer/FaissIVFPQPass.h 0 → 100644 +58 −0 Original line number Diff line number Diff line
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.

#ifdef MILVUS_GPU_VERSION
#pragma once

#include <condition_variable>
#include <cstdint>
#include <deque>
#include <limits>
#include <list>
#include <memory>
#include <mutex>
#include <queue>
#include <string>
#include <thread>
#include <unordered_map>
#include <vector>

#include "Pass.h"

namespace milvus {
namespace scheduler {

// Optimizer pass that decides where FAISS_PQ search tasks run (cpu or a configured GPU).
// The declaration exists only in builds that define MILVUS_GPU_VERSION.
class FaissIVFPQPass : public Pass {
 public:
    FaissIVFPQPass() = default;

    // Reads the GPU search threshold and the search GPU ids from the server config.
    void
    Init() override;

    // Sets the task's resource label when the task is a FAISS_PQ search task;
    // returns false for tasks this pass does not handle.
    bool
    Run(const TaskPtr& task) override;

 private:
    // nq cut-off: jobs with nq below it are sent to the cpu.
    int64_t threshold_ = std::numeric_limits<int64_t>::max();
    // Number of tasks routed to a GPU so far; indexes gpus modulo its size.
    int64_t count_ = 0;
    // Ids of the GPUs available for search, filled in by Init().
    std::vector<int64_t> gpus;
};

using FaissIVFPQPassPtr = std::shared_ptr<FaissIVFPQPass>;

}  // namespace scheduler
}  // namespace milvus
#endif