1 // The MIT License (MIT) 2 // 3 // Copyright (c) 2015 Sergey Makeev, Vadim Slyusarev 4 // 5 // Permission is hereby granted, free of charge, to any person obtaining a copy 6 // of this software and associated documentation files (the "Software"), to deal 7 // in the Software without restriction, including without limitation the rights 8 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 // copies of the Software, and to permit persons to whom the Software is 10 // furnished to do so, subject to the following conditions: 11 // 12 // The above copyright notice and this permission notice shall be included in 13 // all copies or substantial portions of the Software. 14 // 15 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 21 // THE SOFTWARE. 22 23 #include <MTScheduler.h> 24 #include <string.h> // for memset 25 26 namespace MT 27 { 28 29 #ifdef MT_INSTRUMENTED_BUILD 30 TaskScheduler::TaskScheduler(uint32 workerThreadsCount, WorkerThreadParams* workerParameters, IProfilerEventListener* listener) 31 #else 32 TaskScheduler::TaskScheduler(uint32 workerThreadsCount, WorkerThreadParams* workerParameters) 33 #endif 34 : roundRobinThreadIndex(0) 35 , startedThreadsCount(0) 36 { 37 38 #ifdef MT_INSTRUMENTED_BUILD 39 profilerEventListener = listener; 40 #endif 41 42 if (workerThreadsCount != 0) 43 { 44 threadsCount.StoreRelaxed( MT::Clamp(workerThreadsCount, (uint32)1, (uint32)MT_MAX_THREAD_COUNT) ); 45 } else 46 { 47 //query number of processor 48 threadsCount.StoreRelaxed( (uint32)MT::Clamp(Thread::GetNumberOfHardwareThreads() - 1, 1, (int)MT_MAX_THREAD_COUNT) ); 49 } 50 51 // create fiber pool (fibers with standard stack size) 52 for (uint32 i = 0; i < MT_MAX_STANDART_FIBERS_COUNT; i++) 53 { 54 FiberContext& context = standartFiberContexts[i]; 55 context.fiber.Create(MT_STANDART_FIBER_STACK_SIZE, FiberMain, &context); 56 standartFibersAvailable.Push( &context ); 57 } 58 59 // create fiber pool (fibers with extended stack size) 60 for (uint32 i = 0; i < MT_MAX_EXTENDED_FIBERS_COUNT; i++) 61 { 62 FiberContext& context = extendedFiberContexts[i]; 63 context.fiber.Create(MT_EXTENDED_FIBER_STACK_SIZE, FiberMain, &context); 64 extendedFibersAvailable.Push( &context ); 65 } 66 67 68 for (int16 i = 0; i < TaskGroup::MT_MAX_GROUPS_COUNT; i++) 69 { 70 if (i != TaskGroup::DEFAULT) 71 { 72 availableGroups.Push( TaskGroup(i) ); 73 } 74 } 75 76 #if MT_GROUP_DEBUG 77 groupStats[TaskGroup::DEFAULT].SetDebugIsFree(false); 78 #endif 79 80 // create worker thread pool 81 int32 totalThreadsCount = GetWorkersCount(); 82 for (int32 i = 0; i < totalThreadsCount; i++) 83 { 84 threadContext[i].SetThreadIndex(i); 85 threadContext[i].taskScheduler = this; 86 87 uint32 threadCore = i; 88 ThreadPriority::Type priority = ThreadPriority::DEFAULT; 89 if (workerParameters != nullptr) 90 { 91 const WorkerThreadParams& params = workerParameters[i]; 92 93 threadCore = params.core; 94 priority = params.priority; 95 } 96 97 threadContext[i].thread.Start( MT_SCHEDULER_STACK_SIZE, WorkerThreadMain, &threadContext[i], threadCore, priority); 98 } 99 } 100 101 102 TaskScheduler::~TaskScheduler() 103 { 104 int32 totalThreadsCount = GetWorkersCount(); 105 for (int32 i = 0; i < totalThreadsCount; i++) 106 { 107 threadContext[i].state.Store(internal::ThreadState::EXIT); 108 threadContext[i].hasNewTasksEvent.Signal(); 109 } 110 111 for (int32 i = 0; i < totalThreadsCount; i++) 112 { 113 threadContext[i].thread.Join(); 114 } 115 } 116 117 ConcurrentQueueLIFO<FiberContext*>* TaskScheduler::GetFibersStorage(MT::StackRequirements::Type stackRequirements) 118 { 119 ConcurrentQueueLIFO<FiberContext*>* availableFibers = nullptr; 120 switch(stackRequirements) 121 { 122 case MT::StackRequirements::STANDARD: 123 availableFibers = &standartFibersAvailable; 124 break; 125 case MT::StackRequirements::EXTENDED: 126 availableFibers = &extendedFibersAvailable; 127 break; 128 default: 129 MT_REPORT_ASSERT("Unknown stack requrements"); 130 } 131 132 return availableFibers; 133 } 134 135 FiberContext* TaskScheduler::RequestFiberContext(internal::GroupedTask& task) 136 { 137 FiberContext *fiberContext = task.awaitingFiber; 138 if (fiberContext) 139 { 140 task.awaitingFiber = nullptr; 141 return fiberContext; 142 } 143 144 145 MT::StackRequirements::Type stackRequirements = task.desc.stackRequirements; 146 147 ConcurrentQueueLIFO<FiberContext*>* availableFibers = GetFibersStorage(stackRequirements); 148 MT_VERIFY(availableFibers != nullptr, "Can't find fiber storage", return nullptr;); 149 150 if (!availableFibers->TryPopBack(fiberContext)) 151 { 152 MT_REPORT_ASSERT("Fibers pool is empty. Too many fibers running simultaneously."); 153 } 154 155 fiberContext->currentTask = task.desc; 156 fiberContext->currentGroup = task.group; 157 fiberContext->parentFiber = task.parentFiber; 158 fiberContext->stackRequirements = stackRequirements; 159 return fiberContext; 160 } 161 162 void TaskScheduler::ReleaseFiberContext(FiberContext* fiberContext) 163 { 164 MT_ASSERT(fiberContext, "Can't release nullptr Fiber. fiberContext is nullptr"); 165 166 MT::StackRequirements::Type stackRequirements = fiberContext->stackRequirements; 167 fiberContext->Reset(); 168 169 ConcurrentQueueLIFO<FiberContext*>* availableFibers = GetFibersStorage(stackRequirements); 170 MT_VERIFY(availableFibers != nullptr, "Can't find fiber storage", return;); 171 172 availableFibers->Push(fiberContext); 173 } 174 175 FiberContext* TaskScheduler::ExecuteTask(internal::ThreadContext& threadContext, FiberContext* fiberContext) 176 { 177 MT_ASSERT(threadContext.thread.IsCurrentThread(), "Thread context sanity check failed"); 178 179 MT_ASSERT(fiberContext, "Invalid fiber context"); 180 MT_ASSERT(fiberContext->currentTask.IsValid(), "Invalid task"); 181 182 // Set actual thread context to fiber 183 fiberContext->SetThreadContext(&threadContext); 184 185 // Update task status 186 fiberContext->SetStatus(FiberTaskStatus::RUNNED); 187 188 MT_ASSERT(fiberContext->GetThreadContext()->thread.IsCurrentThread(), "Thread context sanity check failed"); 189 190 const void* poolUserData = fiberContext->currentTask.userData; 191 TPoolTaskDestroy poolDestroyFunc = fiberContext->currentTask.poolDestroyFunc; 192 193 // Run current task code 194 Fiber::SwitchTo(threadContext.schedulerFiber, fiberContext->fiber); 195 196 // If task was done 197 FiberTaskStatus::Type taskStatus = fiberContext->GetStatus(); 198 if (taskStatus == FiberTaskStatus::FINISHED) 199 { 200 //destroy task (call dtor) for "fire and forget" type of task from TaskPool 201 if (poolDestroyFunc != nullptr) 202 { 203 poolDestroyFunc(poolUserData); 204 } 205 206 TaskGroup taskGroup = fiberContext->currentGroup; 207 208 TaskScheduler::TaskGroupDescription & groupDesc = threadContext.taskScheduler->GetGroupDesc(taskGroup); 209 210 // Update group status 211 int groupTaskCount = groupDesc.Dec(); 212 MT_ASSERT(groupTaskCount >= 0, "Sanity check failed!"); 213 if (groupTaskCount == 0) 214 { 215 // Signal pending threads that group work is finished. Group can be destroyed after this call. 216 groupDesc.Signal(); 217 218 fiberContext->currentGroup = TaskGroup::INVALID; 219 } 220 221 // Update total task count 222 int allGroupTaskCount = threadContext.taskScheduler->allGroups.Dec(); 223 MT_ASSERT(allGroupTaskCount >= 0, "Sanity check failed!"); 224 if (allGroupTaskCount == 0) 225 { 226 // Notify all tasks in all group finished 227 threadContext.taskScheduler->allGroups.Signal(); 228 } 229 230 FiberContext* parentFiberContext = fiberContext->parentFiber; 231 if (parentFiberContext != nullptr) 232 { 233 int childrenFibersCount = parentFiberContext->childrenFibersCount.DecFetch(); 234 MT_ASSERT(childrenFibersCount >= 0, "Sanity check failed!"); 235 236 if (childrenFibersCount == 0) 237 { 238 // This is a last subtask. Restore parent task 239 MT_ASSERT(threadContext.thread.IsCurrentThread(), "Thread context sanity check failed"); 240 MT_ASSERT(parentFiberContext->GetThreadContext() == nullptr, "Inactive parent should not have a valid thread context"); 241 242 // WARNING!! Thread context can changed here! Set actual current thread context. 243 parentFiberContext->SetThreadContext(&threadContext); 244 245 MT_ASSERT(parentFiberContext->GetThreadContext()->thread.IsCurrentThread(), "Thread context sanity check failed"); 246 247 // All subtasks is done. 248 // Exiting and return parent fiber to scheduler 249 return parentFiberContext; 250 } else 251 { 252 // Other subtasks still exist 253 // Exiting 254 return nullptr; 255 } 256 } else 257 { 258 // Task is finished and no parent task 259 // Exiting 260 return nullptr; 261 } 262 } 263 264 MT_ASSERT(taskStatus != FiberTaskStatus::RUNNED, "Incorrect task status") 265 return nullptr; 266 } 267 268 269 void TaskScheduler::FiberMain(void* userData) 270 { 271 FiberContext& fiberContext = *(FiberContext*)(userData); 272 for(;;) 273 { 274 MT_ASSERT(fiberContext.currentTask.IsValid(), "Invalid task in fiber context"); 275 MT_ASSERT(fiberContext.GetThreadContext(), "Invalid thread context"); 276 MT_ASSERT(fiberContext.GetThreadContext()->thread.IsCurrentThread(), "Thread context sanity check failed"); 277 278 fiberContext.currentTask.taskFunc( fiberContext, fiberContext.currentTask.userData ); 279 280 fiberContext.SetStatus(FiberTaskStatus::FINISHED); 281 282 #ifdef MT_INSTRUMENTED_BUILD 283 fiberContext.fiber.SetName("_idle"); 284 fiberContext.GetThreadContext()->NotifyTaskFinished(fiberContext.currentTask); 285 #endif 286 287 Fiber::SwitchTo(fiberContext.fiber, fiberContext.GetThreadContext()->schedulerFiber); 288 } 289 290 } 291 292 293 bool TaskScheduler::TryStealTask(internal::ThreadContext& threadContext, internal::GroupedTask & task, uint32 workersCount) 294 { 295 if (workersCount <= 1) 296 { 297 return false; 298 } 299 300 uint32 victimIndex = threadContext.random.Get(); 301 302 for (uint32 attempt = 0; attempt < workersCount; attempt++) 303 { 304 uint32 index = victimIndex % workersCount; 305 if (index == threadContext.workerIndex) 306 { 307 victimIndex++; 308 index = victimIndex % workersCount; 309 } 310 311 internal::ThreadContext& victimContext = threadContext.taskScheduler->threadContext[index]; 312 if (victimContext.queue.TryPopNewest(task)) 313 { 314 return true; 315 } 316 317 victimIndex++; 318 } 319 return false; 320 } 321 322 323 void TaskScheduler::WorkerThreadMain( void* userData ) 324 { 325 internal::ThreadContext& context = *(internal::ThreadContext*)(userData); 326 MT_ASSERT(context.taskScheduler, "Task scheduler must be not null!"); 327 328 #ifdef MT_INSTRUMENTED_BUILD 329 const char* threadNames[] = {"worker0","worker1","worker2","worker3","worker4","worker5","worker6","worker7","worker8","worker9","worker10","worker11","worker12"}; 330 if (context.workerIndex < MT_ARRAY_SIZE(threadNames)) 331 { 332 Thread::SetThreadName(threadNames[context.workerIndex]); 333 } else 334 { 335 Thread::SetThreadName("worker_thread"); 336 } 337 #endif 338 339 context.schedulerFiber.CreateFromCurrentThreadAndRun(context.thread, SchedulerFiberMain, userData); 340 } 341 342 343 void TaskScheduler::SchedulerFiberMain( void* userData ) 344 { 345 internal::ThreadContext& context = *(internal::ThreadContext*)(userData); 346 MT_ASSERT(context.taskScheduler, "Task scheduler must be not null!"); 347 348 #ifdef MT_INSTRUMENTED_BUILD 349 context.NotifyThreadCreate(context.workerIndex); 350 #endif 351 352 uint32 workersCount = context.taskScheduler->GetWorkersCount(); 353 int32 totalThreadsCount = context.taskScheduler->threadsCount.LoadRelaxed(); 354 355 context.taskScheduler->startedThreadsCount.IncFetch(); 356 357 //Simple spinlock until all threads is started and initialized 358 for(;;) 359 { 360 int32 initializedThreadsCount = context.taskScheduler->startedThreadsCount.Load(); 361 if (initializedThreadsCount == totalThreadsCount) 362 { 363 break; 364 } 365 366 // sleep some time until all other thread initialized 367 Thread::Sleep(1); 368 } 369 370 HardwareFullMemoryBarrier(); 371 372 #ifdef MT_INSTRUMENTED_BUILD 373 context.NotifyThreadStart(context.workerIndex); 374 #endif 375 376 while(context.state.Load() != internal::ThreadState::EXIT) 377 { 378 internal::GroupedTask task; 379 if (context.queue.TryPopOldest(task) || TryStealTask(context, task, workersCount) ) 380 { 381 // There is a new task 382 FiberContext* fiberContext = context.taskScheduler->RequestFiberContext(task); 383 MT_ASSERT(fiberContext, "Can't get execution context from pool"); 384 MT_ASSERT(fiberContext->currentTask.IsValid(), "Sanity check failed"); 385 MT_ASSERT(fiberContext->stackRequirements == task.desc.stackRequirements, "Sanity check failed"); 386 387 #ifdef MT_INSTRUMENTED_BUILD 388 fiberContext->fiber.SetName(task.desc.debugID); 389 #endif 390 391 while(fiberContext) 392 { 393 #ifdef MT_INSTRUMENTED_BUILD 394 context.NotifyTaskResumed(fiberContext->currentTask); 395 #endif 396 // prevent invalid fiber resume from child tasks, before ExecuteTask is done 397 fiberContext->childrenFibersCount.IncFetch(); 398 399 FiberContext* parentFiber = ExecuteTask(context, fiberContext); 400 401 FiberTaskStatus::Type taskStatus = fiberContext->GetStatus(); 402 403 //release guard 404 int childrenFibersCount = fiberContext->childrenFibersCount.DecFetch(); 405 406 // Can drop fiber context - task is finished 407 if (taskStatus == FiberTaskStatus::FINISHED) 408 { 409 MT_ASSERT( childrenFibersCount == 0, "Sanity check failed"); 410 context.taskScheduler->ReleaseFiberContext(fiberContext); 411 412 // If parent fiber is exist transfer flow control to parent fiber, if parent fiber is null, exit 413 fiberContext = parentFiber; 414 } else 415 { 416 MT_ASSERT( childrenFibersCount >= 0, "Sanity check failed"); 417 418 // No subtasks here and status is not finished, this mean all subtasks already finished before parent return from ExecuteTask 419 if (childrenFibersCount == 0) 420 { 421 MT_ASSERT(parentFiber == nullptr, "Sanity check failed"); 422 } else 423 { 424 // If subtasks still exist, drop current task execution. task will be resumed when last subtask finished 425 break; 426 } 427 428 // If task is in await state drop execution. task will be resumed when RestoreAwaitingTasks called 429 if (taskStatus == FiberTaskStatus::AWAITING_GROUP) 430 { 431 break; 432 } 433 } 434 } //while(fiberContext) 435 436 } else 437 { 438 #ifdef MT_INSTRUMENTED_BUILD 439 context.NotifyThreadIdleBegin(context.workerIndex); 440 #endif 441 442 // Queue is empty and stealing attempt failed 443 // Wait new events 444 context.hasNewTasksEvent.Wait(2000); 445 446 #ifdef MT_INSTRUMENTED_BUILD 447 context.NotifyThreadIdleEnd(context.workerIndex); 448 #endif 449 450 } 451 452 } // main thread loop 453 454 #ifdef MT_INSTRUMENTED_BUILD 455 context.NotifyThreadStop(context.workerIndex); 456 #endif 457 458 } 459 460 void TaskScheduler::RunTasksImpl(ArrayView<internal::TaskBucket>& buckets, FiberContext * parentFiber, bool restoredFromAwaitState) 461 { 462 // This storage is necessary to calculate how many tasks we add to different groups 463 int newTaskCountInGroup[TaskGroup::MT_MAX_GROUPS_COUNT]; 464 465 // Default value is 0 466 memset(&newTaskCountInGroup[0], 0, sizeof(newTaskCountInGroup)); 467 468 // Set parent fiber pointer 469 // Calculate the number of tasks per group 470 // Calculate total number of tasks 471 size_t count = 0; 472 for (size_t i = 0; i < buckets.Size(); ++i) 473 { 474 internal::TaskBucket& bucket = buckets[i]; 475 for (size_t taskIndex = 0; taskIndex < bucket.count; taskIndex++) 476 { 477 internal::GroupedTask & task = bucket.tasks[taskIndex]; 478 479 task.parentFiber = parentFiber; 480 481 int idx = task.group.GetValidIndex(); 482 MT_ASSERT(idx >= 0 && idx < TaskGroup::MT_MAX_GROUPS_COUNT, "Invalid index"); 483 newTaskCountInGroup[idx]++; 484 } 485 486 count += bucket.count; 487 } 488 489 // Increments child fibers count on parent fiber 490 if (parentFiber) 491 { 492 parentFiber->childrenFibersCount.AddFetch((int)count); 493 } 494 495 if (restoredFromAwaitState == false) 496 { 497 // Increase the number of active tasks in the group using data from temporary storage 498 for (size_t i = 0; i < TaskGroup::MT_MAX_GROUPS_COUNT; i++) 499 { 500 int groupNewTaskCount = newTaskCountInGroup[i]; 501 if (groupNewTaskCount > 0) 502 { 503 groupStats[i].Reset(); 504 groupStats[i].Add((uint32)groupNewTaskCount); 505 } 506 } 507 508 // Increments all task in progress counter 509 allGroups.Reset(); 510 allGroups.Add((uint32)count); 511 } else 512 { 513 // If task's restored from await state, counters already in correct state 514 } 515 516 // Add to thread queue 517 for (size_t i = 0; i < buckets.Size(); ++i) 518 { 519 int bucketIndex = roundRobinThreadIndex.IncFetch() % threadsCount.LoadRelaxed(); 520 internal::ThreadContext & context = threadContext[bucketIndex]; 521 522 internal::TaskBucket& bucket = buckets[i]; 523 524 for(;;) 525 { 526 bool res = context.queue.Add(bucket.tasks, bucket.count); 527 if (res == true) 528 { 529 break; 530 } 531 532 //Can't add new tasks onto the queue. Look like the job system is overloaded. Wait some time and try again. 533 //TODO: implement waiting until workers done using events. 534 Thread::Sleep(10); 535 } 536 537 context.hasNewTasksEvent.Signal(); 538 } 539 } 540 541 void TaskScheduler::RunAsync(TaskGroup group, const TaskHandle* taskHandleArray, uint32 taskHandleCount) 542 { 543 MT_ASSERT(!IsWorkerThread(), "Can't use RunAsync inside Task. Use FiberContext.RunAsync() instead."); 544 545 ArrayView<internal::GroupedTask> buffer(MT_ALLOCATE_ON_STACK(sizeof(internal::GroupedTask) * taskHandleCount), taskHandleCount); 546 547 uint32 bucketCount = MT::Min((uint32)GetWorkersCount(), taskHandleCount); 548 ArrayView<internal::TaskBucket> buckets(MT_ALLOCATE_ON_STACK(sizeof(internal::TaskBucket) * bucketCount), bucketCount); 549 550 internal::DistibuteDescriptions(group, taskHandleArray, buffer, buckets); 551 RunTasksImpl(buckets, nullptr, false); 552 } 553 554 bool TaskScheduler::WaitGroup(TaskGroup group, uint32 milliseconds) 555 { 556 MT_VERIFY(IsWorkerThread() == false, "Can't use WaitGroup inside Task. Use FiberContext.WaitGroupAndYield() instead.", return false); 557 558 TaskScheduler::TaskGroupDescription & groupDesc = GetGroupDesc(group); 559 560 return groupDesc.Wait(milliseconds); 561 } 562 563 bool TaskScheduler::WaitAll(uint32 milliseconds) 564 { 565 MT_VERIFY(IsWorkerThread() == false, "Can't use WaitAll inside Task.", return false); 566 567 return allGroups.Wait(milliseconds); 568 } 569 570 bool TaskScheduler::IsEmpty() 571 { 572 for (uint32 i = 0; i < MT_MAX_THREAD_COUNT; i++) 573 { 574 if (!threadContext[i].queue.IsEmpty()) 575 { 576 return false; 577 } 578 } 579 return true; 580 } 581 582 int32 TaskScheduler::GetWorkersCount() const 583 { 584 return threadsCount.LoadRelaxed(); 585 } 586 587 bool TaskScheduler::IsWorkerThread() const 588 { 589 for (uint32 i = 0; i < MT_MAX_THREAD_COUNT; i++) 590 { 591 if (threadContext[i].thread.IsCurrentThread()) 592 { 593 return true; 594 } 595 } 596 return false; 597 } 598 599 TaskGroup TaskScheduler::CreateGroup() 600 { 601 MT_ASSERT(IsWorkerThread() == false, "Can't use CreateGroup inside Task."); 602 603 TaskGroup group; 604 if (!availableGroups.TryPopBack(group)) 605 { 606 MT_REPORT_ASSERT("Group pool is empty"); 607 } 608 609 int idx = group.GetValidIndex(); 610 611 MT_ASSERT(groupStats[idx].GetDebugIsFree() == true, "Bad logic!"); 612 #if MT_GROUP_DEBUG 613 groupStats[idx].SetDebugIsFree(false); 614 #endif 615 616 return group; 617 } 618 619 void TaskScheduler::ReleaseGroup(TaskGroup group) 620 { 621 MT_ASSERT(IsWorkerThread() == false, "Can't use ReleaseGroup inside Task."); 622 MT_ASSERT(group.IsValid(), "Invalid group ID"); 623 624 int idx = group.GetValidIndex(); 625 626 MT_ASSERT(groupStats[idx].GetDebugIsFree() == false, "Group already released"); 627 #if MT_GROUP_DEBUG 628 groupStats[idx].SetDebugIsFree(true); 629 #endif 630 631 availableGroups.Push(group); 632 } 633 634 TaskScheduler::TaskGroupDescription & TaskScheduler::GetGroupDesc(TaskGroup group) 635 { 636 MT_ASSERT(group.IsValid(), "Invalid group ID"); 637 638 int idx = group.GetValidIndex(); 639 TaskScheduler::TaskGroupDescription & groupDesc = groupStats[idx]; 640 641 MT_ASSERT(groupDesc.GetDebugIsFree() == false, "Invalid group"); 642 return groupDesc; 643 } 644 } 645 646 647