229 lines
6.5 KiB
C++
229 lines
6.5 KiB
C++
#include "server/worker_pool.h"
|
|
|
|
#include <csignal>
|
|
#include <string>
|
|
|
|
#include "eventide/ipc/transport.h"
|
|
#include "support/logging.h"
|
|
|
|
namespace clice {
|
|
|
|
namespace {
|
|
|
|
/// Coroutine that reads lines from a worker's stderr pipe and logs them
|
|
/// with a prefix like [SL-0] or [SF-1].
|
|
et::task<> drain_stderr(et::pipe stderr_pipe, std::string prefix) {
|
|
std::string buffer;
|
|
while(true) {
|
|
auto result = co_await stderr_pipe.read();
|
|
if(!result.has_value()) {
|
|
// EOF or error — worker has exited
|
|
break;
|
|
}
|
|
auto& chunk = result.value();
|
|
if(chunk.empty())
|
|
break;
|
|
|
|
buffer += chunk;
|
|
|
|
// Log complete lines
|
|
std::size_t pos = 0;
|
|
while(true) {
|
|
auto nl = buffer.find('\n', pos);
|
|
if(nl == std::string::npos)
|
|
break;
|
|
auto line = buffer.substr(pos, nl - pos);
|
|
if(!line.empty()) {
|
|
LOG_INFO("{} {}", prefix, line);
|
|
}
|
|
pos = nl + 1;
|
|
}
|
|
buffer.erase(0, pos);
|
|
}
|
|
|
|
// Flush any remaining partial line
|
|
if(!buffer.empty()) {
|
|
LOG_INFO("{} {}", prefix, buffer);
|
|
}
|
|
}
|
|
|
|
} // namespace
|
|
|
|
bool WorkerPool::spawn_worker(const std::string& self_path,
|
|
bool stateful,
|
|
std::uint64_t memory_limit) {
|
|
et::process::options opts;
|
|
opts.file = self_path;
|
|
if(stateful) {
|
|
opts.args = {self_path,
|
|
"--mode",
|
|
"stateful-worker",
|
|
"--worker-memory-limit",
|
|
std::to_string(memory_limit)};
|
|
} else {
|
|
opts.args = {self_path, "--mode", "stateless-worker"};
|
|
}
|
|
opts.streams = {
|
|
et::process::stdio::pipe(true, false), // stdin: child reads
|
|
et::process::stdio::pipe(false, true), // stdout: child writes
|
|
et::process::stdio::pipe(false, true), // stderr: child writes
|
|
};
|
|
|
|
auto result = et::process::spawn(opts, loop);
|
|
if(!result) {
|
|
LOG_ERROR("Failed to spawn {} worker: {}",
|
|
stateful ? "stateful" : "stateless",
|
|
result.error().message());
|
|
return false;
|
|
}
|
|
|
|
auto& spawn = *result;
|
|
|
|
// StreamTransport: input = child's stdout (parent reads), output = child's stdin (parent
|
|
// writes)
|
|
auto transport = std::make_unique<et::ipc::StreamTransport>(std::move(spawn.stdout_pipe),
|
|
std::move(spawn.stdin_pipe));
|
|
auto peer = std::make_unique<et::ipc::BincodePeer>(loop, std::move(transport));
|
|
|
|
auto& workers = stateful ? stateful_workers : stateless_workers;
|
|
auto worker_index = workers.size();
|
|
|
|
// Build log prefix: [SF-0] for stateful, [SL-0] for stateless
|
|
std::string prefix =
|
|
std::string("[") + (stateful ? "SF-" : "SL-") + std::to_string(worker_index) + "]";
|
|
|
|
// Schedule stderr log collection
|
|
loop.schedule(drain_stderr(std::move(spawn.stderr_pipe), prefix));
|
|
|
|
workers.push_back(WorkerProcess{
|
|
.proc = std::move(spawn.proc),
|
|
.peer = std::move(peer),
|
|
.owned_documents = 0,
|
|
});
|
|
|
|
auto& w = workers.back();
|
|
loop.schedule(w.peer->run());
|
|
|
|
return true;
|
|
}
|
|
|
|
bool WorkerPool::start(const WorkerPoolOptions& options) {
|
|
for(std::uint32_t i = 0; i < options.stateless_count; ++i) {
|
|
if(!spawn_worker(options.self_path, false, 0)) {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
for(std::uint32_t i = 0; i < options.stateful_count; ++i) {
|
|
if(!spawn_worker(options.self_path, true, options.worker_memory_limit)) {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
// Register evicted notification handler for each stateful worker
|
|
for(std::size_t i = 0; i < stateful_workers.size(); ++i) {
|
|
stateful_workers[i].peer->on_notification([this](const worker::EvictedParams& params) {
|
|
if(on_evicted) {
|
|
on_evicted(params.path);
|
|
}
|
|
});
|
|
}
|
|
|
|
LOG_INFO("WorkerPool started: {} stateless, {} stateful workers",
|
|
stateless_workers.size(),
|
|
stateful_workers.size());
|
|
return true;
|
|
}
|
|
|
|
et::task<> WorkerPool::stop() {
|
|
LOG_INFO("WorkerPool stopping...");
|
|
|
|
// Close output pipes to signal workers to exit gracefully
|
|
for(auto& w: stateless_workers) {
|
|
w.peer->close_output();
|
|
}
|
|
for(auto& w: stateful_workers) {
|
|
w.peer->close_output();
|
|
}
|
|
|
|
// Send SIGTERM to all workers
|
|
for(auto& w: stateless_workers) {
|
|
w.proc.kill(SIGTERM);
|
|
}
|
|
for(auto& w: stateful_workers) {
|
|
w.proc.kill(SIGTERM);
|
|
}
|
|
|
|
// Wait for all worker processes to exit
|
|
for(auto& w: stateless_workers) {
|
|
co_await w.proc.wait();
|
|
}
|
|
for(auto& w: stateful_workers) {
|
|
co_await w.proc.wait();
|
|
}
|
|
|
|
LOG_INFO("WorkerPool stopped");
|
|
}
|
|
|
|
std::size_t WorkerPool::assign_worker(std::uint32_t path_id) {
|
|
auto it = owner.find(path_id);
|
|
if(it != owner.end()) {
|
|
// Already assigned; touch LRU
|
|
auto lru_it = owner_lru_index.find(path_id);
|
|
if(lru_it != owner_lru_index.end()) {
|
|
owner_lru.erase(lru_it->second);
|
|
}
|
|
owner_lru.push_front(path_id);
|
|
owner_lru_index[path_id] = owner_lru.begin();
|
|
return it->second;
|
|
}
|
|
|
|
// New assignment: pick the least-loaded worker
|
|
auto selected = pick_least_loaded();
|
|
owner[path_id] = selected;
|
|
stateful_workers[selected].owned_documents++;
|
|
owner_lru.push_front(path_id);
|
|
owner_lru_index[path_id] = owner_lru.begin();
|
|
return selected;
|
|
}
|
|
|
|
std::size_t WorkerPool::pick_least_loaded() {
|
|
std::size_t best = 0;
|
|
for(std::size_t i = 1; i < stateful_workers.size(); ++i) {
|
|
if(stateful_workers[i].owned_documents < stateful_workers[best].owned_documents) {
|
|
best = i;
|
|
}
|
|
}
|
|
return best;
|
|
}
|
|
|
|
void WorkerPool::remove_owner(std::uint32_t path_id) {
|
|
auto it = owner.find(path_id);
|
|
if(it == owner.end())
|
|
return;
|
|
|
|
auto worker_idx = it->second;
|
|
stateful_workers[worker_idx].owned_documents--;
|
|
owner.erase(it);
|
|
|
|
auto lru_it = owner_lru_index.find(path_id);
|
|
if(lru_it != owner_lru_index.end()) {
|
|
owner_lru.erase(lru_it->second);
|
|
owner_lru_index.erase(lru_it);
|
|
}
|
|
}
|
|
|
|
void WorkerPool::clear_owner(std::size_t worker_index) {
|
|
llvm::SmallVector<std::uint32_t> to_remove;
|
|
for(auto& [pid, widx]: owner) {
|
|
if(widx == worker_index) {
|
|
to_remove.push_back(pid);
|
|
}
|
|
}
|
|
for(auto pid: to_remove) {
|
|
remove_owner(pid);
|
|
}
|
|
}
|
|
|
|
} // namespace clice
|