HomeSort by relevance Sort by last modified time
    Searched refs:blockDim (Results 1 - 25 of 44) sorted by null

1 2

  /external/tensorflow/tensorflow/examples/adding_an_op/
cuda_op_kernel.cu.cc 21 for (int i = blockIdx.x * blockDim.x + threadIdx.x; i < N;
22 i += blockDim.x * gridDim.x) {
  /external/tensorflow/tensorflow/tools/ci_build/builds/user_ops/
cuda_op_kernel.cu.cc 21 for (int i = blockIdx.x * blockDim.x + threadIdx.x; i < N;
22 i += blockDim.x * gridDim.x) {
  /external/tensorflow/tensorflow/core/kernels/
concat_lib_gpu_impl.cu.cc 40 IntType gidx = blockIdx.x * blockDim.x + threadIdx.x;
42 for (; gidx < total_cols; gidx += blockDim.x * gridDim.x) {
43 IntType gidy = blockIdx.y * blockDim.y + threadIdx.y;
49 for (; gidy < total_rows; gidy += blockDim.y * gridDim.y) {
68 IntType gidx = blockIdx.x * blockDim.x + threadIdx.x;
76 IntType lidx = threadIdx.y * blockDim.x + threadIdx.x;
77 IntType blockSize = blockDim.x * blockDim.y;
96 for (; gidx < total_cols; gidx += blockDim.x * gridDim.x) {
107 IntType gidy = blockIdx.y * blockDim.y + threadIdx.y
    [all...]
split_lib_gpu.cu.cc 78 eigen_assert(blockDim.y == 1);
79 eigen_assert(blockDim.z == 1);
118 IntType gidx = blockIdx.x * blockDim.x + threadIdx.x;
126 IntType lidx = threadIdx.y * blockDim.x + threadIdx.x;
127 IntType blockSize = blockDim.x * blockDim.y;
146 for (; gidx < total_cols; gidx += blockDim.x * gridDim.x) {
157 IntType gidy = blockIdx.y * blockDim.y + threadIdx.y;
158 for (; gidy < total_rows; gidy += blockDim.y * gridDim.y)
173 eigen_assert(blockDim.y == 1)
    [all...]
check_numerics_op_gpu.cu.cc 39 const int32 thread_id = blockIdx.x * blockDim.x + threadIdx.x;
40 const int32 total_thread_count = gridDim.x * blockDim.x;
bucketize_op_gpu.cu.cc 46 int32 lidx = threadIdx.y * blockDim.x + threadIdx.x;
47 int32 blockSize = blockDim.x * blockDim.y;
bias_op_gpu.cu.cc 121 for (int32 index = threadIdx.x; index < bias_size; index += blockDim.x) {
126 for (int32 index = blockIdx.x * blockDim.x + threadIdx.x; index < nthreads;
127 index += blockDim.x * gridDim.x) {
133 for (int32 index = threadIdx.x; index < bias_size; index += blockDim.x) {
147 for (int32 index = threadIdx.x; index < kSDataSize; index += blockDim.x) {
158 for (int32 index = group_index * blockDim.x + threadIdx.x;
159 index < total_count; index += blockDim.x * group_size) {
random_op_gpu.cu.cc 134 const int32 thread_id = blockIdx.x * blockDim.x + threadIdx.x;
135 const int32 total_thread_count = gridDim.x * blockDim.x;
175 const int32 thread_id = blockIdx.x * blockDim.x + threadIdx.x;
176 const int32 total_thread_count = gridDim.x * blockDim.x;
  /external/eigen/unsupported/Eigen/CXX11/src/Tensor/
TensorReductionCuda.h 115 const Index thread_id = blockIdx.x * blockDim.x + threadIdx.x;
116 const Index num_threads = blockDim.x * gridDim.x;
192 eigen_assert(blockDim.x == 1);
205 const Index thread_id = blockIdx.x * blockDim.x + threadIdx.x;
206 const Index num_threads = blockDim.x * gridDim.x;
378 eigen_assert(blockDim.y == 1);
379 eigen_assert(blockDim.z == 1);
386 const Index input_col_blocks = divup<Index>(num_coeffs_to_reduce, blockDim.x * NumPerThread);
389 const Index num_threads = blockDim.x * gridDim.x;
390 const Index thread_id = blockIdx.x * blockDim.x + threadIdx.x
    [all...]
  /external/tensorflow/tensorflow/contrib/mpi_collectives/kernels/
ring.cu.cc 90 for (size_t i = blockIdx.x * blockDim.x + threadIdx.x; i < N;
91 i += blockDim.x * gridDim.x) {
  /external/tensorflow/tensorflow/core/util/
cuda_device_functions.h 90 return detail::CudaGridRange<T>(blockIdx.x * blockDim.x + threadIdx.x,
91 gridDim.x * blockDim.x, count);
98 return detail::CudaGridRange<T>(blockIdx.y * blockDim.y + threadIdx.y,
99 gridDim.y * blockDim.y, count);
106 return detail::CudaGridRange<T>(blockIdx.z * blockDim.z + threadIdx.z,
107 gridDim.z * blockDim.z, count);
386 assert(blockDim.y == 1 && blockDim.z == 1);
387 assert(blockDim.x * gridDim.x / blockDim.x == gridDim.x)
    [all...]
  /external/eigen/test/
cuda_common.h 11 dim3 threadIdx, blockDim, blockIdx;
26 int i = threadIdx.x + blockIdx.x*blockDim.x;
  /external/clang/lib/Headers/
cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-3289846/lib64/clang/3.8/include/
cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-3859424/lib64/clang/4.0/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4053586/lib64/clang/5.0/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4393122/lib64/clang/5.0.1/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4479392/lib64/clang/5.0.2/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4579689/lib64/clang/6.0.1/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4630689/lib64/clang/6.0.1/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4639204/lib64/clang/6.0.1/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/darwin-x86/clang-4691093/lib64/clang/6.0.2/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/linux-x86/clang-3289846/lib64/clang/3.8/include/
cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/linux-x86/clang-3859424/lib64/clang/4.0/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
  /prebuilts/clang/host/linux-x86/clang-4053586/lib64/clang/5.0/include/
__clang_cuda_builtin_vars.h 92 // blockDim should be convertible to dim3 (in fact in nvcc, it *is* a
114 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;

Completed in 781 milliseconds

1 2