|
|
@ -89,7 +89,6 @@ void* thread_function(void* argp) { |
|
|
|
|
|
|
|
template <typename path> |
|
|
|
std::vector<uint64_t> execute_dml_memcpy(std::vector<TaskData>& args, const uint64_t iterations) { |
|
|
|
std::vector<std::thread> threads; |
|
|
|
std::vector<uint64_t> timing; |
|
|
|
|
|
|
|
// initialize numa library
|
|
|
@ -98,7 +97,8 @@ std::vector<uint64_t> execute_dml_memcpy(std::vector<TaskData>& args, const uint |
|
|
|
// for each submitted task we link the semaphore
|
|
|
|
// and create the thread, passing the argument
|
|
|
|
|
|
|
|
for (uint64_t i = 0; i < iterations; i++) { |
|
|
|
for (uint64_t i = 0; i < iterations + 5; i++) { |
|
|
|
std::vector<std::thread> threads; |
|
|
|
std::promise<void> launch_promise; |
|
|
|
LAUNCH_ = launch_promise.get_future(); |
|
|
|
|
|
|
@ -117,7 +117,7 @@ std::vector<uint64_t> execute_dml_memcpy(std::vector<TaskData>& args, const uint |
|
|
|
|
|
|
|
const auto time_end = std::chrono::steady_clock::now(); |
|
|
|
|
|
|
|
timing.emplace_back(std::chrono::duration_cast<std::chrono::nanoseconds>(time_end - time_start).count()); |
|
|
|
if (i >= 5) timing.emplace_back(std::chrono::duration_cast<std::chrono::nanoseconds>(time_end - time_start).count()); |
|
|
|
} |
|
|
|
|
|
|
|
return timing; |