From 819d2d80e0524dbd9bf1616e0db08818100af7a1 Mon Sep 17 00:00:00 2001
From: Přemysl Eric Janouch
Date: Thu, 18 Jan 2024 01:24:15 +0100
Subject: Limit concurrency to number of hardware threads

---
 deeptagger/deeptagger.cpp | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

(limited to 'deeptagger')

diff --git a/deeptagger/deeptagger.cpp b/deeptagger/deeptagger.cpp
index 103047b..cb28d92 100644
--- a/deeptagger/deeptagger.cpp
+++ b/deeptagger/deeptagger.cpp
@@ -598,7 +598,11 @@ infer(Ort::Env &env, const char *path, const std::vector &images)
 	Thumbnailing ctx;
 	for (const auto &path : images)
 		ctx.input.push(path);
-	for (auto i = g.batch; i--; )
+
+	auto workers = g.batch;
+	if (auto threads = std::thread::hardware_concurrency())
+		workers = std::min(workers, long(threads));
+	for (auto i = workers; i--; )
 		std::thread(thumbnail, std::ref(config), *width, *height,
 			std::ref(ctx)).detach();
 
@@ -610,7 +614,7 @@ infer(Ort::Env &env, const char *path, const std::vector &images)
 
 		std::unique_lock output_lock(ctx.output_mutex);
 		ctx.output_cv.wait(output_lock,
-			[&]{ return ctx.output.size() == g.batch || ctx.done == g.batch; });
+			[&]{ return ctx.output.size() == g.batch || ctx.done == workers; });
 
 		// It would be possible to add dummy entries to the batch,
 		// so that the model doesn't need to be rebuilt.
@@ -618,7 +622,7 @@ infer(Ort::Env &env, const char *path, const std::vector &images)
 			run(ctx.output, config, session, shape);
 			ctx.output.clear();
 		}
-		if (ctx.done == g.batch)
+		if (ctx.done == workers)
 			break;
 	}
 }
-- 
cgit v1.2.3-70-g09d2