From de082fedf62c987d04ae33b8c6c87a503992c260 Mon Sep 17 00:00:00 2001 From: chatlanin Date: Tue, 19 Nov 2024 10:41:10 +0300 Subject: [PATCH] start new impl --- src/meson.build | 3 +- src/pgxx/pgxx.hpp | 82 ++--------- src/pgxx/query_builder.hpp | 22 +-- src/pgxx/utils/aliases.hpp | 5 + src/pgxx/utils/define.hpp | 3 - src/pgxx/utils/using.hpp | 8 -- tests/main.cpp | 194 ++++++++++++++++++++++--- tests/thread/pool.hpp | 288 +++++++++++++++++++++++++++++++++++++ tests/thread/queue.hpp | 108 ++++++++++++++ 9 files changed, 595 insertions(+), 118 deletions(-) create mode 100644 src/pgxx/utils/aliases.hpp delete mode 100644 src/pgxx/utils/define.hpp delete mode 100644 src/pgxx/utils/using.hpp create mode 100644 tests/thread/pool.hpp create mode 100644 tests/thread/queue.hpp diff --git a/src/meson.build b/src/meson.build index 2ce7ba3..347b716 100755 --- a/src/meson.build +++ b/src/meson.build @@ -3,8 +3,7 @@ headers = [ 'pgxx/pgxx.hpp', 'pgxx/query_builder.hpp', - 'pgxx/utils/define.hpp', - 'pgxx/utils/using.hpp', + 'pgxx/utils/aliases.hpp', 'pgxx/utils/var.hpp', ] diff --git a/src/pgxx/pgxx.hpp b/src/pgxx/pgxx.hpp index 4cd20d4..b8ac01a 100644 --- a/src/pgxx/pgxx.hpp +++ b/src/pgxx/pgxx.hpp @@ -4,55 +4,45 @@ #include "hack/exception/exception.hpp" #include "hack/logger/logger.hpp" -#include "pgxx/utils/define.hpp" -#include "pgxx/utils/using.hpp" -#include "pgxx/utils/var.hpp" -#include "pgxx/query_builder.hpp" -#include "pgxx/pool_connection.hpp" +#include "utils/aliases.hpp" // IWYU pragma: keep +#include "utils/var.hpp" +#include "pool_connection.hpp" namespace pgxx { - class manager : public hack::utils::singleton + class database : public hack::utils::singleton { - friend hack::utils::singleton; + friend hack::utils::singleton; public: - ~manager() = default; + ~database() = default; private: - manager() = default; - std::map m_data_connections; + database() = default; + std::map m_connections; public: - bool ready() { return m_data_connections.size() != 0; } + bool ready() { return m_connections.size() != 0; } void init(std::string connection_name, int connection_count, std::string connection_url) { - m_data_connections[connection_name] = pool_connection { connection_count, connection_url }; + m_connections[connection_name] = pool_connection { connection_count, connection_url }; hack::log("")("make connection [", connection_name, "] completed"); } template - JSON execute(const std::string connection_name, std::string func_name, const Args&... args) + pqxx::result execute(const std::string connection_name, std::string query) { - auto query = prepare(func_name, args...); - JSON result; + pqxx::result r; try { - auto c = m_data_connections[connection_name].get(); + auto c = m_connections[connection_name].get(); - pqxx::result r; pqxx::work work { *c }; r = work.exec(query); - - std::string r_str; - for (auto row : r) r_str = row.at(0).c_str(); - work.commit(); - m_data_connections[connection_name].release(c); - - result = JSON::parse(r_str); + m_connections[connection_name].release(c); } catch (const std::exception& e) { @@ -61,15 +51,6 @@ namespace pgxx ex.system_error(e); ex.params("connection_name", connection_name); ex.params("query", query); - ex.params("result", result); - - if (connection_name == var::LOG_CONNECTION) - { - hack::error()("WARNING!!! ERROR LOG TO DATABASE"); - hack::error()("query", query); - hack::error()(e.what()); - std::terminate(); - } throw ex; } catch (...) @@ -79,44 +60,11 @@ namespace pgxx ex.message(var::EXECUTE_ERROR); ex.params("connection_name", connection_name); ex.params("query", query); - ex.params("result", result); - - if (connection_name == var::LOG_CONNECTION) - { - hack::error()("WARNING!!! ERROR LOG TO DATABASE"); - hack::error()("query", query); - std::terminate(); - } throw ex; } - return result; + return r; } - - private: - template - std::string prepare(const std::string func_name, const Args&... args) - { - std::string query; - - try - { - query = builder::make_query(func_name, args...); - } - catch (const std::exception& e) - { - hack::exception ex; - ex.description("database dont create query from args"); - ex.system_error(e); - ex.params("query", query); - ex.variadic_params(args...); - throw ex; - } - - return query; - } - - }; } diff --git a/src/pgxx/query_builder.hpp b/src/pgxx/query_builder.hpp index 294ba1d..201f7db 100644 --- a/src/pgxx/query_builder.hpp +++ b/src/pgxx/query_builder.hpp @@ -2,25 +2,22 @@ #include -#include "hack/string/string_concat_helper.hpp" #include "hack/concepts/concepts.hpp" -#include "utils/using.hpp" - namespace pgxx::builder { template std::string make_one(First f) { f = std::regex_replace(f, std::regex("'"), "[quote]"); - return hack::string::str_concat + "'" + f + "',"; + return "'" + f + "',"; } inline std::string make_one(const char* f) { auto f_str = std::string(f); f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + "'" + f_str + "',"; + return "'" + f_str + "',"; } inline std::string make_one(char f) @@ -34,35 +31,28 @@ namespace pgxx::builder { auto f_str = std::to_string(f); f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + "'" + f_str + "',"; + return "'" + f_str + "',"; } inline std::string make_one(const float f) { auto f_str = std::to_string(f); f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + f_str + ","; + return f_str + ","; } inline std::string make_one(int f) { auto f_str = std::to_string(f); f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + f_str + ","; + return f_str + ","; } inline std::string make_one(const std::string& f) { auto f_str = f; f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + "'" + f_str + "',"; - } - - inline std::string make_one(const JSON& f) - { - auto f_str = f.dump(); - f_str = std::regex_replace(f_str, std::regex("'"), "[quote]"); - return hack::string::str_concat + "'" + f_str + "'::jsonb,"; + return "'" + f_str + "',"; } // это заглушкa при компиляции пустых данных diff --git a/src/pgxx/utils/aliases.hpp b/src/pgxx/utils/aliases.hpp new file mode 100644 index 0000000..d6942a0 --- /dev/null +++ b/src/pgxx/utils/aliases.hpp @@ -0,0 +1,5 @@ +#pragma once + +#ifndef PGXX +#define PGXX() pgxx::database::instance() +#endif diff --git a/src/pgxx/utils/define.hpp b/src/pgxx/utils/define.hpp deleted file mode 100644 index f293701..0000000 --- a/src/pgxx/utils/define.hpp +++ /dev/null @@ -1,3 +0,0 @@ -#pragma once - -#define PGXX() pgxx::manager::instance() diff --git a/src/pgxx/utils/using.hpp b/src/pgxx/utils/using.hpp deleted file mode 100644 index 8bf172e..0000000 --- a/src/pgxx/utils/using.hpp +++ /dev/null @@ -1,8 +0,0 @@ -#pragma once - -#include "nlohmann/json.hpp" - -namespace pgxx -{ - using JSON = nlohmann::json; -} diff --git a/tests/main.cpp b/tests/main.cpp index 3aa3747..2a0366e 100644 --- a/tests/main.cpp +++ b/tests/main.cpp @@ -1,7 +1,177 @@ -#include +#include #include +#include #include "pgxx/pgxx.hpp" +#include "thread/pool.hpp" + +const int MAX_QUERY_IN_DB = 10'000; +const float MAX_OVERLAP = 12.f; + +struct bit +{ + std::string m_id; + std::string m_url; + std::string m_artist; + std::string m_song; + std::vector m_key; + std::vector m_duration; +}; + +bit target; + +std::vector parse_array(const std::string& arr_str) +{ + std::vector result; + std::stringstream ss(arr_str); + std::string item; + + while (std::getline(ss, item, ',')) + { + try + { + result.push_back(std::stoi(item)); + } + catch (const std::invalid_argument&) + { + std::cerr << "Ошибка преобразования: " << item << std::endl; + } + } + return result; +} + +namespace calc +{ + inline int calculation(int db_offset) + { + std::vector vb; + vb.reserve(MAX_QUERY_IN_DB); + + std::string query = "SELECT * FROM t_media LIMIT " + std::to_string(MAX_QUERY_IN_DB) + " OFFSET " + std::to_string(db_offset); + auto r = PGXX().execute("con_1", query); + + for (auto el : r) + { + bit b; + + b.m_id = el["m_id"].as(); + b.m_url = el["m_url"].as(); + b.m_artist = el["m_artist"].as(); + b.m_song = el["m_song"].as(); + + std::string str = el["m_key"].as(); + b.m_key = parse_array(str); + + str = el["m_duration"].as(); + b.m_duration = parse_array(str); + vb.push_back(b); + } + + return vb.size(); + } +} + +namespace executor +{ + inline void get_recomended() + { + try + { + int count = 0; + std::string query = "SELECT count(*) FROM t_media WHERE m_cleared = 0;"; + auto r = PGXX().execute("con_1", query); + for (auto eld : r) count = eld["count"].as(); + + thread::pool pool; + + auto start = std::chrono::high_resolution_clock::now(); + int i = 0; + int def = count / MAX_QUERY_IN_DB + 1; + int db_offset = 0; + + std::vector> futures; + futures.reserve(def); + + while (def > 0) + { + futures.push_back(pool.enqueue(calc::calculation, db_offset)); + db_offset += MAX_QUERY_IN_DB; + --def; + } + + for (auto &f : futures) + { + int r = f.get(); + i += r; + } + + std::chrono::duration elapsed = std::chrono::high_resolution_clock::now() - start; + hack::log()(i, elapsed.count()); + } + catch(const std::exception& e) + { + hack::log()(e.what()); + throw; + } + catch(hack::exception& ex) + { + ex.log(); + throw; + } + catch(...) + { + hack::log()("ooops!"); + throw; + } + } +} + +void convert_db() +{ + bool is_work = true; + int count = 0; + while (is_work) + { + try + { + std::string query = "SELECT * FROM t_media WHERE m_cleared = 0 LIMIT " + std::to_string(1) + ";"; + auto r = PGXX().execute("con_1", query); + hack::log("")("size = ", r.size(), ", count = ", count); + + for (auto el : r) + { + target.m_id = el["m_id"].as(); + target.m_url = el["m_url"].as(); + target.m_artist = el["m_artist"].as(); + target.m_song = el["m_song"].as(); + + std::string key = el["m_key"].as(); + std::string duration = el["m_duration"].as(); + + query = "UPDATE t_media SET m_cleared = 1 WHERE m_id = '" + target.m_id + "';"; + PGXX().execute("con_1", query); + + executor::get_recomended(); + } + + query = "SELECT count(*) FROM t_media WHERE m_cleared = 0;"; + r = PGXX().execute("con_1", query); + + for (auto eld : r) + { + auto c = eld["count"].as(); + if (count - c > 1) hack::log()("DOUBLE"); + count = c; + } + + if (count == 0) is_work = false; + } + catch(hack::exception& e) + { + e.log(); + } + } +} auto main(int argc, char* args[]) -> int { @@ -10,7 +180,6 @@ auto main(int argc, char* args[]) -> int try { PGXX().init("con_1", 300, con); - PGXX().init("con_2", 300, con); } catch(hack::exception& ex) { @@ -21,24 +190,5 @@ auto main(int argc, char* args[]) -> int if (!PGXX().ready()) hack::log()("error connection"); - pgxx::JSON j { - { - "params", { { "key_1", 1 }, { "key2", "value" } } - } - }; - - for (auto i = 0; i < 10; ++i) - { - std::thread th([&j](){ - auto r = PGXX().execute("con_1", "read_and_write", j); - }); - th.detach(); - } - - for (auto i = 0; i < 10; ++i) - { - auto r = PGXX().execute("con_2", "read_and_write", j); - } - - hack::log()("ok"); + convert_db(); } diff --git a/tests/thread/pool.hpp b/tests/thread/pool.hpp new file mode 100644 index 0000000..e265417 --- /dev/null +++ b/tests/thread/pool.hpp @@ -0,0 +1,288 @@ +#pragma once + +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#include "queue.hpp" + +namespace thread +{ + namespace details + { + using default_function_type = std::function; + } + + template + requires std::invocable && std::is_same_v> + class pool + { + public: + template > + requires std::invocable && std::is_same_v> + explicit pool(const unsigned int& number_of_threads = std::thread::hardware_concurrency(), InitializationFunction init = [](std::size_t) {}) : tasks_(number_of_threads) + { + std::size_t current_id = 0; + for (std::size_t i = 0; i < number_of_threads; ++i) + { + priority_queue_.push_back(size_t(current_id)); + try + { + threads_.emplace_back([&, id = current_id, init](const std::stop_token &stop_tok) { + // invoke the init function on the thread + try + { + std::invoke(init, id); + } + catch (...) + { + // suppress exceptions + } + + do + { + // wait until signaled + tasks_[id].signal.acquire(); + do + { + // invoke the task + while (auto task = tasks_[id].tasks.pop_front()) + { + // decrement the unassigned tasks as the task is now going + // to be executed + unassigned_tasks_.fetch_sub(1, std::memory_order_release); + // invoke the task + std::invoke(std::move(task.value())); + // the above task can push more work onto the pool, so we + // only decrement the in flights once the task has been + // executed because now it's now longer "in flight" + in_flight_tasks_.fetch_sub(1, std::memory_order_release); + } + + // try to steal a task + for (std::size_t j = 1; j < tasks_.size(); ++j) + { + const std::size_t index = (id + j) % tasks_.size(); + if (auto task = tasks_[index].tasks.steal()) + { + // steal a task + unassigned_tasks_.fetch_sub(1, std::memory_order_release); + std::invoke(std::move(task.value())); + in_flight_tasks_.fetch_sub(1, std::memory_order_release); + // stop stealing once we have invoked a stolen task + break; + } + } + // check if there are any unassigned tasks before rotating to the + // front and waiting for more work + } while (unassigned_tasks_.load(std::memory_order_acquire) > 0); + + priority_queue_.rotate_to_front(id); + // check if all tasks are completed and release the "barrier" + if (in_flight_tasks_.load(std::memory_order_acquire) == 0) + { + // in theory, only one thread will set this + threads_complete_signal_.store(true, std::memory_order_release); + threads_complete_signal_.notify_one(); + } + } while (!stop_tok.stop_requested()); + }); + // increment the thread id + ++current_id; + } + catch (...) + { + tasks_.pop_back(); + std::ignore = priority_queue_.pop_back(); + } + } + } + + ~pool() + { + wait_for_tasks(); + // stop all threads + for (std::size_t i = 0; i < threads_.size(); ++i) + { + threads_[i].request_stop(); + tasks_[i].signal.release(); + threads_[i].join(); + } + } + + /// thread pool is non-copyable + pool(const pool &) = delete; + pool &operator=(const pool &) = delete; + + /** + * @brief Enqueue a task into the thread pool that returns a result. + * @details Note that task execution begins once the task is enqueued. + * @tparam Function An invokable type. + * @tparam Args Argument parameter pack + * @tparam ReturnType The return type of the Function + * @param f The callable function + * @param args The parameters that will be passed (copied) to the function. + * @return A std::future that can be used to retrieve the returned value. + */ + template > + requires std::invocable + [[nodiscard]] std::future enqueue(Function f, Args... args) + { + /* + * use shared promise here so that we don't break the promise later (until C++23) + * + * with C++23 we can do the following: + * + * std::promise promise; + * auto future = promise.get_future(); + * auto task = [func = std::move(f), ...largs = std::move(args), + promise = std::move(promise)]() mutable {...}; + */ + auto shared_promise = std::make_shared>(); + auto task = [func = std::move(f), ... largs = std::move(args), promise = shared_promise]() { + try + { + if constexpr (std::is_same_v) + { + func(largs...); + promise->set_value(); + } + else + { + promise->set_value(func(largs...)); + } + + } + catch (...) + { + promise->set_exception(std::current_exception()); + } + }; + + // get the future before enqueuing the task + auto future = shared_promise->get_future(); + // enqueue the task + enqueue_task(std::move(task)); + return future; + } + + /** + * @brief Enqueue a task to be executed in the thread pool. Any return value of the function + * will be ignored. + * @tparam Function An invokable type. + * @tparam Args Argument parameter pack for Function + * @param func The callable to be executed + * @param args Arguments that will be passed to the function. + */ + template + requires std::invocable + void enqueue_detach(Function &&func, Args &&...args) + { + enqueue_task(std::move([f = std::forward(func), ... largs = std::forward(args)]() mutable -> decltype(auto) { + // suppress exceptions + try + { + if constexpr (std::is_same_v>) + { + std::invoke(f, largs...); + } + else + { + // the function returns an argument, but can be ignored + std::ignore = std::invoke(f, largs...); + } + } + catch (...) + { + } + })); + } + + /** + * @brief Returns the number of threads in the pool. + * + * @return std::size_t The number of threads in the pool. + */ + [[nodiscard]] auto size() const { return threads_.size(); } + + /** + * @brief Wait for all tasks to finish. + * @details This function will block until all tasks have been completed. + */ + void wait_for_tasks() + { + if (in_flight_tasks_.load(std::memory_order_acquire) > 0) + { + // wait for all tasks to finish + threads_complete_signal_.wait(false); + } + } + + /** + * @brief Makes best-case attempt to clear all tasks from the thread_pool + * @details Note that this does not guarantee that all tasks will be cleared, as currently + * running tasks could add additional tasks. Also a thread could steal a task from another + * in the middle of this. + * @return number of tasks cleared + */ + size_t clear_tasks() + { + size_t removed_task_count{0}; + for (auto &task_list : tasks_) + { + removed_task_count += task_list.tasks.clear(); + } + in_flight_tasks_.fetch_sub(removed_task_count, std::memory_order_release); + unassigned_tasks_.fetch_sub(removed_task_count, std::memory_order_release); + + return removed_task_count; + } + + private: + template + void enqueue_task(Function &&f) + { + auto i_opt = priority_queue_.copy_front_and_rotate_to_back(); + if (!i_opt.has_value()) + { + // would only be a problem if there are zero threads + return; + } + // get the index + auto i = *(i_opt); + + // increment the unassigned tasks and in flight tasks + unassigned_tasks_.fetch_add(1, std::memory_order_release); + const auto prev_in_flight = in_flight_tasks_.fetch_add(1, std::memory_order_release); + + // reset the in flight signal if the list was previously empty + if (prev_in_flight == 0) + { + threads_complete_signal_.store(false, std::memory_order_release); + } + + // assign work + tasks_[i].tasks.push_back(std::forward(f)); + tasks_[i].signal.release(); + } + + struct task_item + { + queue tasks{}; + std::binary_semaphore signal{0}; + }; + + std::vector threads_; + std::deque tasks_; + queue priority_queue_; + // guarantee these get zero-initialized + std::atomic_int_fast64_t unassigned_tasks_{0}, in_flight_tasks_{0}; + std::atomic_bool threads_complete_signal_{false}; + }; +} diff --git a/tests/thread/queue.hpp b/tests/thread/queue.hpp new file mode 100644 index 0000000..7681c0a --- /dev/null +++ b/tests/thread/queue.hpp @@ -0,0 +1,108 @@ +#pragma once + +#include +#include +#include +#include + +namespace thread +{ + template + class queue + { + public: + using value_type = T; + using size_type = typename std::deque::size_type; + + public: + queue() = default; + + void push_back(T&& value) + { + std::scoped_lock lock(m_mutex); + m_data.push_back(std::forward(value)); + } + + void push_front(T&& value) + { + std::scoped_lock lock(m_mutex); + m_data.push_front(std::forward(value)); + } + + [[nodiscard]] bool empty() const + { + std::scoped_lock lock(m_mutex); + return m_data.empty(); + } + + size_type clear() + { + std::scoped_lock lock(m_mutex); + auto size = m_data.size(); + m_data.clear(); + + return size; + } + + [[nodiscard]] std::optional pop_front() + { + std::scoped_lock lock(m_mutex); + if (m_data.empty()) return std::nullopt; + + auto front = std::move(m_data.front()); + m_data.pop_front(); + return front; + } + + [[nodiscard]] std::optional pop_back() + { + std::scoped_lock lock(m_mutex); + if (m_data.empty()) return std::nullopt; + + auto back = std::move(m_data.back()); + m_data.pop_back(); + return back; + } + + [[nodiscard]] std::optional steal() + { + std::scoped_lock lock(m_mutex); + if (m_data.empty()) return std::nullopt; + + auto back = std::move(m_data.back()); + m_data.pop_back(); + return back; + } + + void rotate_to_front(const T& item) + { + std::scoped_lock lock(m_mutex); + auto iter = std::find(m_data.begin(), m_data.end(), item); + + if (iter != m_data.end()) + { + std::ignore = m_data.erase(iter); + } + + m_data.push_front(item); + } + + [[nodiscard]] std::optional copy_front_and_rotate_to_back() + { + std::scoped_lock lock(m_mutex); + + if (m_data.empty()) return std::nullopt; + + auto front = m_data.front(); + m_data.pop_front(); + + m_data.push_back(front); + + return front; + } + + private: + std::deque m_data{}; + std::mutex m_mutex{}; + }; +}