Skip to content

Commit

Permalink
Add __launch_bounds__(1024) to greedy kernels
Browse files: browse the repository at this point in the history.
  • Loading branch information
Natalia Gimelshein authored and soumith committed Jul 13, 2017
1 parent c3c0d9b commit 27d79db
Showing 1 changed file with 2 additions and 0 deletions.
2 changes: 2 additions & 0 deletions lib/THCUNN/VolumetricUpSamplingTrilinear.cu
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
#include "THCAtomics.cuh"

template<typename Dtype, typename Acctype>
__launch_bounds__(1024)
__global__ void caffe_gpu_interp2_kernel(const int n,
const Acctype rdepth, const Acctype rheight, const Acctype rwidth,
const THCDeviceTensor<Dtype, 5> data1, THCDeviceTensor<Dtype, 5> data2) {
Expand Down Expand Up @@ -77,6 +78,7 @@ __global__ void caffe_gpu_interp2_kernel(const int n,

// Backward (adjoint) operation: data1 <- data2 (accumulates into data1)
template <typename Dtype, typename Acctype>
__launch_bounds__(1024)
__global__ void caffe_gpu_interp2_kernel_backward(const int n,
const Acctype rdepth, const Acctype rheight, const Acctype rwidth,
THCDeviceTensor<Dtype, 5> data1, const THCDeviceTensor<Dtype, 5> data2){
Expand Down

0 comments on commit 27d79db

Please sign in to comment.