Allow injecting tasks into lokimq job queue

This allows mixing some outside task into the lokimq job queue for a category (queued up with native LMQ requests for that category) for use when there is some external process that is able to generate messages. For example, the most immediate use for this is to allow an HTTP server to handle incoming RPC requests and, as soon as they arrive, inject them into LokiMQ's queue for the "rpc" category so that native LMQ rpc requests and HTTP rpc requests share the same thread pool and queue. These injected jobs bypass all of LokiMQ's authentication and response mechanisms: that's up to the invoked callback itself to manage. Injected tasks are somewhat similar to batch jobs, but unlike batch jobs the are queued and prioritized as ordinary external LokiMQ requests. (Batch jobs, in contrast, have a higher scheduling priority, no queue limits, and typically a larger available thread pool).
2020-06-07 21:30:46 -03:00 · 2020-06-07 21:30:46 -03:00 · 932bbb33d7
parent 07b31bd8a1
commit 932bbb33d7
6 changed files with 233 additions and 26 deletions
--- a/lokimq/lokimq.cpp
+++ b/lokimq/lokimq.cpp
@ -349,30 +349,45 @@ void LokiMQ::set_general_threads(int threads) {
 LokiMQ::run_info& LokiMQ::run_info::load(category* cat_, std::string command_, ConnectionID conn_, Access access_, std::string remote_,
                std::vector<zmq::message_t> data_parts_, const std::pair<CommandCallback, bool>* callback_) {
-    is_batch_job = false;
+    reset();
    is_reply_job = false;
    is_tagged_thread_job = false;
    cat = cat_;
    command = std::move(command_);
    conn = std::move(conn_);
    access = std::move(access_);
    remote = std::move(remote_);
    data_parts = std::move(data_parts_);
-    callback = callback_;
+    to_run = callback_;
    return *this;
 }
 LokiMQ::run_info& LokiMQ::run_info::load(category* cat_, std::string command_, std::string remote_, std::function<void()> callback) {
    reset();
    is_injected = true;
    cat = cat_;
    command = std::move(command_);
    conn = {};
    access = {};
    remote = std::move(remote_);
    to_run = std::move(callback);
    return *this;
 }
 LokiMQ::run_info& LokiMQ::run_info::load(pending_command&& pending) {
    if (auto *f = std::get_if<std::function<void()>>(&pending.callback))
        return load(&pending.cat, std::move(pending.command), std::move(pending.remote), std::move(*f));
    assert(pending.callback.index() == 0);
    return load(&pending.cat, std::move(pending.command), std::move(pending.conn), std::move(pending.access),
-            std::move(pending.remote), std::move(pending.data_parts), pending.callback);
+            std::move(pending.remote), std::move(pending.data_parts), std::get<0>(pending.callback));
 }
 LokiMQ::run_info& LokiMQ::run_info::load(batch_job&& bj, bool reply_job, int tagged_thread) {
    reset();
    is_batch_job = true;
    is_reply_job = reply_job;
    is_tagged_thread_job = tagged_thread > 0;
    batch_jobno = bj.second;
-    batch = bj.first;
+    to_run = bj.first;
    return *this;
 }
--- a/lokimq/lokimq.h
+++ b/lokimq/lokimq.h
@ -596,6 +596,18 @@ private:
    bool proxy_check_auth(size_t conn_index, bool outgoing, const peer_info& peer,
            zmq::message_t& command, const cat_call_t& cat_call, std::vector<zmq::message_t>& data);
    struct injected_task {
        category& cat;
        std::string command;
        std::string remote;
        std::function<void()> callback;
    };
    /// Injects a external callback to be handled by a worker; this is the proxy side of
    /// inject_task().
    void proxy_inject_task(injected_task task);
    /// Set of active service nodes.
    pubkey_set active_service_nodes;
@ -607,20 +619,30 @@ private:
    void proxy_update_active_sns_clean(pubkey_set added, pubkey_set removed);
    /// Details for a pending command; such a command already has authenticated access and is just
-    /// waiting for a thread to become available to handle it.
+    /// waiting for a thread to become available to handle it.  This also gets used (via the
    /// `callback` variant) for injected external jobs to be able to integrate some external
    /// interface with the lokimq job queue.
    struct pending_command {
        category& cat;
        std::string command;
        std::vector<zmq::message_t> data_parts;
-        const std::pair<CommandCallback, bool>* callback;
+        std::variant<
            const std::pair<CommandCallback, bool>*, // Normal command callback
            std::function<void()> // Injected external callback
        > callback;
        ConnectionID conn;
        Access access;
        std::string remote;
        // Normal ctor for an actual lmq command being processed
        pending_command(category& cat, std::string command, std::vector<zmq::message_t> data_parts,
                const std::pair<CommandCallback, bool>* callback, ConnectionID conn, Access access, std::string remote)
            : cat{cat}, command{std::move(command)}, data_parts{std::move(data_parts)},
            callback{callback}, conn{std::move(conn)}, access{std::move(access)}, remote{std::move(remote)} {}
        // Ctor for an injected external command.
        pending_command(category& cat, std::string command, std::function<void()> callback, std::string remote)
            : cat{cat}, command{std::move(command)}, callback{std::move(callback)}, remote{std::move(remote)} {}
    };
    std::list<pending_command> pending_commands;
@ -635,9 +657,15 @@ private:
        bool is_batch_job = false;
        bool is_reply_job = false;
        bool is_tagged_thread_job = false;
        bool is_injected = false;
        // resets the job type bools, above.
        void reset() { is_batch_job = is_reply_job = is_tagged_thread_job = is_injected = false; }
        // If is_batch_job is false then these will be set appropriate (if is_batch_job is true then
-        // these shouldn't be accessed and likely contain stale data).
+        // these shouldn't be accessed and likely contain stale data).  Note that if the command is
        // an external, injected command then conn, access, conn_route, and data_parts will be
        // empty/default constructed.
        category *cat;
        std::string command;
        ConnectionID conn; // The connection (or SN pubkey) to reply on/to.
@ -649,10 +677,13 @@ private:
        // If is_batch_job true then these are set (if is_batch_job false then don't access these!):
        int batch_jobno; // >= 0 for a job, -1 for the completion job
-        union {
+        // The callback or batch job to run.  The first of these is for regular tasks, the second
-            const std::pair<CommandCallback, bool>* callback; // set if !is_batch_job
+        // for batch jobs, the third for injected external tasks.
-            detail::Batch* batch;                             // set if is_batch_job
+        std::variant<
-        };
+            const std::pair<CommandCallback, bool>*,
            detail::Batch*,
            std::function<void()>
        > to_run;
        // These belong to the proxy thread and must not be accessed by a worker:
        std::thread worker_thread;
@ -663,8 +694,12 @@ private:
        run_info& load(category* cat, std::string command, ConnectionID conn, Access access, std::string remote,
                std::vector<zmq::message_t> data_parts, const std::pair<CommandCallback, bool>* callback);
        /// Loads the run info with an injected external command
        run_info& load(category* cat, std::string command, std::string remote, std::function<void()> callback);
        /// Loads the run info with a stored pending command
        run_info& load(pending_command&& pending);
        /// Loads the run info with a batch job
        run_info& load(batch_job&& bj, bool reply_job = false, int tagged_thread = 0);
    };
@ -1091,6 +1126,32 @@ public:
    template <typename... T>
    void request(ConnectionID to, std::string_view cmd, ReplyCallback callback, const T&... opts);
    /** Injects an external task into the lokimq command queue.  This is used to allow connecting
     * non-LokiMQ requests into the LokiMQ thread pool as if they were ordinary requests, to be
     * scheduled as commands of an individual category.  For example, you might support rpc requests
     * via LokiMQ as `rpc.some_command` and *also* accept them over HTTP.  Using `inject_task()`
     * allows you to handle processing the request in the same thread pool with the same priority as
     * `rpc.*` commands.
     *
     * @param category - the category name that should handle the request for the purposes of
     * scheduling the job.  The category must have been added using add_category().  The category
     * can be an actual category with added commands, in which case the injected tasks are queued
     * along with LMQ requests for that category, or can have no commands to set up a distinct
     * category for the injected jobs.
     *
     * @param command - a command name; this is mainly used for debugging and does not need to
     * actually exist (and, in fact, is often less confusing if it does not).  It is recommended for
     * clarity purposes to use something that doesn't look like a typical command, for example
     * "(http)".
     *
     * @param remote - some free-form identifier of the remote connection.  For example, this could
     * be a remote IP address.  Can be blank if there is nothing suitable.
     *
     * @param callback - the function to call from a worker thread when the injected task is
     * processed.  Takes no arguments.
     */
    void inject_task(const std::string& category, std::string command, std::string remote, std::function<void()> callback);
    /// The key pair this LokiMQ was created with; if empty keys were given during construction then
    /// this returns the generated keys.
    const std::string& get_pubkey() const { return pubkey; }
--- a/lokimq/proxy.cpp
+++ b/lokimq/proxy.cpp
@ -263,6 +263,9 @@ void LokiMQ::proxy_control_message(std::vector<zmq::message_t>& parts) {
            LMQ_TRACE("proxy batch jobs");
            auto ptrval = bt_deserialize<uintptr_t>(data);
            return proxy_batch(reinterpret_cast<detail::Batch*>(ptrval));
        } else if (cmd == "INJECT") {
            LMQ_TRACE("proxy inject");
            return proxy_inject_task(detail::deserialize_object<injected_task>(bt_deserialize<uintptr_t>(data)));
        } else if (cmd == "SET_SNS") {
            return proxy_set_active_sns(data);
        } else if (cmd == "UPDATE_SNS") {
@ -684,5 +687,4 @@ void LokiMQ::proxy_process_queue() {
    }
 }
 }
--- a/lokimq/worker.cpp
+++ b/lokimq/worker.cpp
@ -92,13 +92,19 @@ void LokiMQ::worker_thread(unsigned int index, std::optional<std::string> tagged
        try {
            if (run.is_batch_job) {
                auto* batch = std::get<detail::Batch*>(run.to_run);
                if (run.batch_jobno >= 0) {
-                    LMQ_TRACE("worker thread ", worker_id, " running batch ", run.batch, "#", run.batch_jobno);
+                    LMQ_TRACE("worker thread ", worker_id, " running batch ", batch, "#", run.batch_jobno);
-                    run.batch->run_job(run.batch_jobno);
+                    batch->run_job(run.batch_jobno);
                } else if (run.batch_jobno == -1) {
-                    LMQ_TRACE("worker thread ", worker_id, " running batch ", run.batch, " completion");
+                    LMQ_TRACE("worker thread ", worker_id, " running batch ", batch, " completion");
-                    run.batch->job_completion();
+                    batch->job_completion();
                }
            } else if (run.is_injected) {
                auto& func = std::get<std::function<void()>>(run.to_run);
                LMQ_TRACE("worker thread ", worker_id, " invoking injected command ", run.command);
                func();
                func = nullptr;
            } else {
                message.conn = run.conn;
                message.access = run.access;
@ -107,7 +113,8 @@ void LokiMQ::worker_thread(unsigned int index, std::optional<std::string> tagged
                LMQ_TRACE("Got incoming command from ", message.remote, "/", message.conn, message.conn.route.empty() ? " (outgoing)" : " (incoming)");
-                if (run.callback->second /*is_request*/) {
+                auto& [callback, is_request] = *std::get<const std::pair<CommandCallback, bool>*>(run.to_run);
                if (is_request) {
                    message.reply_tag = {run.data_parts[0].data<char>(), run.data_parts[0].size()};
                    for (auto it = run.data_parts.begin() + 1; it != run.data_parts.end(); ++it)
                        message.data.emplace_back(it->data<char>(), it->size());
@ -117,7 +124,7 @@ void LokiMQ::worker_thread(unsigned int index, std::optional<std::string> tagged
                }
                LMQ_TRACE("worker thread ", worker_id, " invoking ", run.command, " callback with ", message.data.size(), " message parts");
-                run.callback->first(message);
+                callback(message);
            }
        }
        catch (const bt_deserialize_invalid& e) {
@ -194,16 +201,17 @@ void LokiMQ::proxy_worker_message(std::vector<zmq::message_t>& parts) {
                active--;
            }
            bool clear_job = false;
            auto* batch = std::get<detail::Batch*>(run.to_run);
            if (run.batch_jobno == -1) {
                // Returned from the completion function
                clear_job = true;
            } else {
-                auto [state, thread] = run.batch->job_finished();
+                auto [state, thread] = batch->job_finished();
                if (state == detail::BatchState::complete) {
                    if (thread == -1) { // run directly in proxy
                        LMQ_TRACE("Completion job running directly in proxy");
                        try {
-                            run.batch->job_completion(); // RUN DIRECTLY IN PROXY THREAD
+                            batch->job_completion(); // RUN DIRECTLY IN PROXY THREAD
                        } catch (const std::exception &e) {
                            // Raise these to error levels: the caller really shouldn't be doing
                            // anything non-trivial in an in-proxy completion function!
@ -219,7 +227,7 @@ void LokiMQ::proxy_worker_message(std::vector<zmq::message_t>& parts) {
                            : run.is_reply_job
                              ? reply_jobs
                              : batch_jobs;
-                        jobs.emplace(run.batch, -1);
+                        jobs.emplace(batch, -1);
                    }
                } else if (state == detail::BatchState::done) {
                    // No completion job
@ -229,9 +237,9 @@ void LokiMQ::proxy_worker_message(std::vector<zmq::message_t>& parts) {
            }
            if (clear_job) {
-                batches.erase(run.batch);
+                batches.erase(batch);
-                delete run.batch;
+                delete batch;
-                run.batch = nullptr;
+                run.to_run = static_cast<detail::Batch*>(nullptr);
            }
        } else {
            assert(run.cat->active_threads > 0);
@ -360,5 +368,38 @@ void LokiMQ::proxy_to_worker(size_t conn_index, std::vector<zmq::message_t>& par
    category.active_threads++;
 }
 void LokiMQ::inject_task(const std::string& category, std::string command, std::string remote, std::function<void()> callback) {
    if (!callback) return;
    auto it = categories.find(category);
    if (it == categories.end())
        throw std::out_of_range{"Invalid category `" + category + "': category does not exist"};
    detail::send_control(get_control_socket(), "INJECT", bt_serialize(detail::serialize_object(
                injected_task{it->second, std::move(command), std::move(remote), std::move(callback)})));
 }
 void LokiMQ::proxy_inject_task(injected_task task) {
    auto& category = task.cat;
    if (category.active_threads >= category.reserved_threads && active_workers() >= general_workers) {
        // No free worker slot, queue for later
        if (category.max_queue >= 0 && category.queued >= category.max_queue) {
            LMQ_LOG(warn, "No space to queue injected task ", task.command, "; already have ", category.queued,
                    "commands queued in that category (max ", category.max_queue, "); dropping task");
            return;
        }
        LMQ_LOG(debug, "No available free workers for injected task ", task.command, "; queuing for later");
        pending_commands.emplace_back(category, std::move(task.command), std::move(task.callback), std::move(task.remote));
        category.queued++;
        return;
    }
    auto& run = get_idle_worker();
    LMQ_TRACE("Forwarding incoming injected task ", task.command, " from ", task.remote, " to worker ", run.worker_routing_id);
    run.load(&category, std::move(task.command), std::move(task.remote), std::move(task.callback));
    proxy_run_worker(run);
    category.active_threads++;
 }
 }
--- a/tests/CMakeLists.txt
+++ b/tests/CMakeLists.txt
@ -10,6 +10,7 @@ set(LMQ_TEST_SRC
    test_commands.cpp
    test_encoding.cpp
    test_failures.cpp
    test_inject.cpp
    test_requests.cpp
    test_tagged_threads.cpp
    )
--- a/tests/test_inject.cpp
+++ b/tests/test_inject.cpp
@ -0,0 +1,87 @@
 #include "common.h"
 using namespace lokimq;
 TEST_CASE("injected external commands", "[injected]") {
    std::string listen = "tcp://127.0.0.1:4567";
    LokiMQ server{
        "", "", // generate ephemeral keys
        false, // not a service node
        [](auto) { return ""; },
        get_logger("S» "),
        LogLevel::trace
    };
    server.set_general_threads(1);
    server.listen_curve(listen);
    std::atomic<int> hellos = 0;
    std::atomic<bool> done = false;
    server.add_category("public", AuthLevel::none, 3);
    server.add_command("public", "hello", [&](Message& m) {
        hellos++;
        while (!done) std::this_thread::sleep_for(10ms);
    });
    server.start();
    LokiMQ client{get_logger("C» "), LogLevel::trace};
    client.start();
    std::atomic<bool> got{false};
    bool success = false;
    auto c = client.connect_remote(listen,
            [&](auto conn) { success = true; got = true; },
            [&](auto conn, std::string_view) { got = true; },
            server.get_pubkey());
    wait_for_conn(got);
    {
        auto lock = catch_lock();
        REQUIRE( got );
        REQUIRE( success );
    }
    // First make sure that basic message respects the 3 thread limit
    client.send(c, "public.hello");
    client.send(c, "public.hello");
    client.send(c, "public.hello");
    client.send(c, "public.hello");
    wait_for([&] { return hellos >= 3; });
    std::this_thread::sleep_for(20ms);
    {
        auto lock = catch_lock();
        REQUIRE( hellos == 3 );
    }
    done = true;
    wait_for([&] { return hellos >= 4; });
    {
        auto lock = catch_lock();
        REQUIRE( hellos == 4 );
    }
    // Now try injecting external commands
    done = false;
    hellos = 0;
    client.send(c, "public.hello");
    wait_for([&] { return hellos >= 1; });
    server.inject_task("public", "(injected)", "localhost", [&] { hellos += 10; while (!done) std::this_thread::sleep_for(10ms); });
    wait_for([&] { return hellos >= 11; });
    client.send(c, "public.hello");
    wait_for([&] { return hellos >= 12; });
    server.inject_task("public", "(injected)", "localhost", [&] { hellos += 10; while (!done) std::this_thread::sleep_for(10ms); });
    server.inject_task("public", "(injected)", "localhost", [&] { hellos += 10; while (!done) std::this_thread::sleep_for(10ms); });
    server.inject_task("public", "(injected)", "localhost", [&] { hellos += 10; while (!done) std::this_thread::sleep_for(10ms); });
    wait_for([&] { return hellos >= 12; });
    std::this_thread::sleep_for(20ms);
    {
        auto lock = catch_lock();
        REQUIRE( hellos == 12 );
    }
    done = true;
    wait_for([&] { return hellos >= 42; });
    {
        auto lock = catch_lock();
        REQUIRE( hellos == 42 );
    }
 }