From 819d2d80e0524dbd9bf1616e0db08818100af7a1 Mon Sep 17 00:00:00 2001
From: Přemysl Eric Janouch
Date: Thu, 18 Jan 2024 01:24:15 +0100
Subject: Limit concurrency to number of hardware threads
---
deeptagger/deeptagger.cpp | 10 +++++++---
1 file changed, 7 insertions(+), 3 deletions(-)
(limited to 'deeptagger/deeptagger.cpp')
diff --git a/deeptagger/deeptagger.cpp b/deeptagger/deeptagger.cpp
index 103047b..cb28d92 100644
--- a/deeptagger/deeptagger.cpp
+++ b/deeptagger/deeptagger.cpp
@@ -598,7 +598,11 @@ infer(Ort::Env &env, const char *path, const std::vector<std::string> &images)
Thumbnailing ctx;
for (const auto &path : images)
ctx.input.push(path);
- for (auto i = g.batch; i--; )
+
+ auto workers = g.batch;
+ if (auto threads = std::thread::hardware_concurrency())
+ workers = std::min(workers, long(threads));
+ for (auto i = workers; i--; )
std::thread(thumbnail, std::ref(config), *width, *height,
std::ref(ctx)).detach();
@@ -610,7 +614,7 @@ infer(Ort::Env &env, const char *path, const std::vector<std::string> &images)
std::unique_lock output_lock(ctx.output_mutex);
ctx.output_cv.wait(output_lock,
- [&]{ return ctx.output.size() == g.batch || ctx.done == g.batch; });
+ [&]{ return ctx.output.size() == g.batch || ctx.done == workers; });
// It would be possible to add dummy entries to the batch,
// so that the model doesn't need to be rebuilt.
@@ -618,7 +622,7 @@ infer(Ort::Env &env, const char *path, const std::vector<std::string> &images)
run(ctx.output, config, session, shape);
ctx.output.clear();
}
- if (ctx.done == g.batch)
+ if (ctx.done == workers)
break;
}
}
--
cgit v1.2.3-70-g09d2