/* File: hl_thread.ph (last committed by zhangjinchao01). */
/* Copyright (c) 2016 Baidu, Inc. All Rights Reserve.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#ifndef HL_THREAD_PH_
#define HL_THREAD_PH_

#include <stdio.h>
#include <pthread.h>
#include <cuda.h>
#include <cuda_runtime.h>
#include <cublas_v2.h>
#include <curand.h>
#include <cudnn.h>
#include "hl_base.h"

/**
 * @brief   Thread resource structure.
 *
 * Bundles the streams, library handles, memory pointers and device
 * information kept for a thread. Each member is described next to its
 * declaration.
 */
typedef struct {
    /** Stream for thread; the array holds HPPL_STREAM_END entries. */
    cudaStream_t stream[HPPL_STREAM_END];

    /** Cublas handle. */
    cublasHandle_t handle;

    /** Curand generator. */
    curandGenerator_t gen;

    /** Cudnn handle. */
    cudnnHandle_t cudnn_handle;

    /** Cudnn image descriptor. */
    cudnnTensorDescriptor_t cudnn_desc;

    /** Gen lock (pointer to a pthread mutex). */
    pthread_mutex_t *gen_mutex;

    /** HPPL GPU memory. */
    real *gpu_mem;

    /** HPPL CPU memory. */
    real *cpu_mem;

    /** Event associated with gpu_mem. */
    cudaEvent_t event;

    /** Thread device context. */
    int device;

    /**
     * Compute capability.
     * NOTE(review): presumably the major version number, judging by the
     * field name -- confirm against the code that fills it in.
     */
    int major;

    /** Whether the thread has been initialized. */
    bool is_init;
} _hl_thread_resource;

/** Pointer form of the thread resource structure. */
typedef _hl_thread_resource *hl_thread_resource;

/**
 * @brief   Thread resource object with thread-local storage (`__thread`),
 *          so each thread sees its own instance.
 *
 * This is a declaration only; the definition is not part of this header.
 */
extern __thread _hl_thread_resource t_resource;

/**
 * @brief   Initialize cudnn.
 *
 * Declaration only; the implementation is not part of this header.
 *
 * @param   cudnn_handle  Pointer to the cudnn handle.
 * @param   stream        Stream to use for cudnn.
 */
extern void hl_cudnn_init(
    cudnnHandle_t *cudnn_handle,
    cudaStream_t stream);

/**
 * @brief   Initialize cublas.
 *
 * Declaration only; the implementation is not part of this header.
 *
 * @param   cublas_handle  Pointer to the cublas handle.
 * @param   stream         Cuda stream.
 */
extern void hl_cublas_init(
    cublasHandle_t *cublas_handle,
    cudaStream_t stream);

/**
 * @brief   Initialize a cudnn tensor descriptor.
 *
 * Declaration only; the implementation is not part of this header.
 *
 * @param   cudnn_desc    Pointer to the cudnn tensor descriptor.
 */
extern void hl_cudnn_desc_init(
    cudnnTensorDescriptor_t *cudnn_desc);

#endif  /* HL_THREAD_PH_ */