view src/parallel_execution/TaskManagerImpl.cbc @ 319:a15511b1a6e0

separate cuda.c, and USE_CUDA_MAIN_THREAD flag
author Shinji KONO <kono@ie.u-ryukyu.ac.jp>
date Wed, 15 Feb 2017 20:43:55 +0900
parents 51aa65676e37
children f23f6d0aa4e9
line wrap: on
line source

#include "../context.h"

#include <stdio.h>

void createWorkers(struct Context* context, TaskManager* taskManeger, TaskManagerImpl* taskManagerImpl);

TaskManager* createTaskManagerImpl(struct Context* context, int numCPU, int numGPU, int numIO) {
    struct TaskManager* taskManager = new TaskManager();
    // 0...numIO-1 IOProcessor 
    // numIO...numIO+numGPU-1 GPUProcessor
    // numIO+numGPU...numIO+numGPU+numCPU-1 CPUProcessor
    taskManager->io = 0;
    taskManager->gpu = numIO;
    taskManager->cpu = numIO+numGPU;
    taskManager->maxCPU = numIO+numGPU+numCPU;
    taskManager->createTask = C_createTask;
    taskManager->spawn = C_spawnTaskManager;
    taskManager->shutdown  = C_shutdownTaskManager;
    struct TaskManagerImpl* taskManagerImpl = new TaskManagerImpl();
    taskManagerImpl -> activeQueue = createSingleLinkedQueue(context);
    taskManagerImpl -> taskQueue = createSingleLinkedQueue(context);
    taskManagerImpl -> numWorker = taskManager->maxCPU;
    createWorkers(context, taskManager, taskManagerImpl);
    taskManager->taskManager = (union Data*)taskManagerImpl;
    return taskManager;
}

void createWorkers(struct Context* context, TaskManager* taskManager, TaskManagerImpl* taskManagerImpl) {
    int i = 0;
    taskManagerImpl->workers = (Worker**)ALLOC_ARRAY(context, Worker, taskManager->maxCPU);
    for (;i<taskManager->gpu;i++) {
        Queue* queue = createSynchronizedQueue(context);
        taskManagerImpl->workers[i] = (Worker*)createCPUWorker(context, i, queue);
    }
    for (;i<taskManager->cpu;i++) {
#ifdef USE_CUDAWorker
        Queue* queue = createSynchronizedQueue(context);
#ifndef USE_CUDA_MAIN_THREAD
        taskManagerImpl->workers[i] = (Worker*)createCUDAWorker(context, i, queue,0);
#else
        taskManagerImpl->workers[i] = (Worker*)queue;
#endif
#else
        Queue* queue = createSynchronizedQueue(context);
        taskManagerImpl->workers[i] = (Worker*)createCPUWorker(context, i, queue);
#endif        
    }
    for (;i<taskManager->maxCPU;i++) {
        Queue* queue = createSynchronizedQueue(context);
        taskManagerImpl->workers[i] = (Worker*)createCPUWorker(context, i, queue);
    }
}

__code createTask(struct TaskManager* taskManager) {
    taskManager->context = NEW(struct Context);
    initContext(taskManager->context);
    taskManager->context->taskManager = taskManager;
    goto meta(context, C_setWorker);
}

__code setWorker(struct TaskManagerImpl* taskManager, struct Context* task, __code next(...)) {
    task->workerId = taskManager->sendWorkerIndex;
    if(++taskManager->sendWorkerIndex >= taskManager->numWorker) {
        taskManager->sendWorkerIndex = 0;
    }
    goto next(...);
}

__code setWorker_stub(struct Context* context) {
    TaskManagerImpl* taskManager = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    goto setWorker(context, taskManager, Gearef(context, TaskManager)->context, Gearef(context, TaskManager)->next);
}

__code spawnTaskManager(struct TaskManagerImpl* taskManager, struct Queue* queue, struct Context* task, __code next(...)) {
    if (task->idgCount == 0) {
        // enqueue activeQueue
        queue->queue = (union Data*)taskManager->activeQueue;
    } else {
        // enqueue waitQueue
        queue->queue = (union Data*)taskManager->taskQueue;
    }
    queue->data = (union Data*)task;
    queue->next = C_spawnTaskManager1;
    goto meta(context, queue->queue->Queue.put);
}

__code spawnTaskManager_stub(struct Context* context) {
    TaskManagerImpl* taskManager = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    pthread_mutex_lock(&taskManager->mutex);
    goto spawnTaskManager(context,
                          taskManager,
                          Gearef(context, Queue),
                          Gearef(context, TaskManager)->context,
                          Gearef(context, TaskManager)->next);
}


__code spawnTaskManager1(struct TaskManagerImpl* taskManager) {
    pthread_mutex_unlock(&taskManager->mutex);
    goto meta(context, C_taskSend);
}

__code spawnTaskManager1_stub(struct Context* context) {
    TaskManagerImpl* taskManager = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    goto spawnTaskManager1(context,
                           taskManager);
}

__code taskSend(struct TaskManagerImpl* taskManager, struct Queue* queue) {
    queue->queue = (union Data*)taskManager->activeQueue;
    queue->next = C_taskSend1;
    goto meta(context, taskManager->activeQueue->take);
}

__code taskSend1(struct TaskManagerImpl* taskManager, struct Queue* queue, struct Context* task, __code next(...)) {
    struct Queue* tasks = taskManager->workers[task->workerId]->tasks;
    queue->queue = (union Data*)tasks;
    queue->data = (union Data*)task;
    queue->next = next;
    goto meta(context, tasks->put);
}

__code taskSend1_stub(struct Context* context) {
    TaskManagerImpl* taskManager = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    goto taskSend1(context, taskManager, Gearef(context, Queue), Gearef(context, TaskManager)->context, Gearef(context, TaskManager)->next);
}

__code shutdownTaskManager(struct LoopCounter* loopCounter, struct TaskManager* taskManager, struct TaskManagerImpl* taskManagerImpl, struct Queue* queue, __code next(...)) {
    int i = loopCounter->i;
    if (taskManager->cpu <= i && i < taskManager->maxCPU) {
        struct Queue* tasks = taskManagerImpl->workers[i]->tasks;
        queue->queue = (union Data*)tasks;
        queue->data = NULL;
        queue->next = C_shutdownTaskManager1;
        goto meta(context, tasks->put);
    }

    loopCounter->i = 0;
    goto meta(context, next);
}

__code shutdownTaskManager_stub(struct Context* context) {
    TaskManagerImpl* taskManagerImpl = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    goto shutdownTaskManager(context, Gearef(context, LoopCounter), &Gearef(context, TaskManager)->taskManager->TaskManager, taskManagerImpl, Gearef(context, Queue), Gearef(context, TaskManager)->next);
}

__code shutdownTaskManager1(struct LoopCounter* loopCounter, TaskManagerImpl* taskManagerImpl) {
    int i = loopCounter->i;
    pthread_join(taskManagerImpl->workers[i]->worker->CPUWorker.thread, NULL);
    loopCounter->i++;
    goto meta(context, C_shutdownTaskManager);
}

__code shutdownTaskManager1_stub(struct Context* context) {
    TaskManagerImpl* taskManagerImpl = (TaskManagerImpl*)GearImpl(context, TaskManager, taskManager);
    goto shutdownTaskManager1(context, Gearef(context, LoopCounter), taskManagerImpl);
}