Home
last modified time | relevance | path

Searched defs:smem (Results 1 – 25 of 35) sorted by relevance

12

/external/opencv3/modules/core/include/opencv2/core/cuda/
Demulation.hpp84 struct smem struct
86 enum { TAG_MASK = (1U << ( (sizeof(unsigned int) << 3) - 5U)) - 1U };
89 static __device__ __forceinline__ T atomicInc(T* address, T val) in atomicInc()
108 static __device__ __forceinline__ T atomicAdd(T* address, T val) in atomicAdd()
127 static __device__ __forceinline__ T atomicMin(T* address, T val) in atomicMin()
Dvec_distance.hpp160 …Global(const T1* vec1, const T2* vec2, int len, Dist& dist, typename Dist::result_type* smem, int … in calcVecDiffGlobal()
178 …onst T1* vecCached, const T2* vecGlob, int len, Dist& dist, typename Dist::result_type* smem, int … in calcVecDiffCached()
Dreduce.hpp59 __device__ __forceinline__ void reduce(volatile T* smem, T& val, unsigned int tid, const Op& op) in reduce()
67 …ce__ __forceinline__ void reduce(const thrust::tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in reduce()
/external/opencv3/modules/cudev/include/opencv2/cudev/block/detail/
Dreduce.hpp85 get<I>(smem)[tid] = get<I>(val); in loadToSmem() local
102 get<I>(smem)[tid] = get<I>(val) = get<I>(op)(get<I>(val), reg); in merge() local
146 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& val, uint tid) in loadToSmem()
152 __device__ __forceinline__ void loadFromSmem(volatile T* smem, T& val, uint tid) in loadFromSmem()
159 …device__ __forceinline__ void loadToSmem(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in loadToSmem()
168 …vice__ __forceinline__ void loadFromSmem(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in loadFromSmem()
178 …__device__ __forceinline__ void merge(volatile T* smem, T& val, uint tid, uint delta, const Op& op) in merge()
187 __device__ __forceinline__ void merge(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in merge()
Dreduce_key_val.hpp84 get<I>(smem)[tid] = get<I>(data); in loadToSmem() local
152 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& data, uint tid) in loadToSmem()
158 __device__ __forceinline__ void loadFromSmem(volatile T* smem, T& data, uint tid) in loadFromSmem()
165 …_forceinline__ void loadToSmem(const tuple<VP0, VP1, VP2, VP3, VP4, VP5, VP6, VP7, VP8, VP9>& smem, in loadToSmem()
174 …orceinline__ void loadFromSmem(const tuple<VP0, VP1, VP2, VP3, VP4, VP5, VP6, VP7, VP8, VP9>& smem, in loadFromSmem()
/external/opencv3/modules/cudev/include/opencv2/cudev/block/
Dscan.hpp58 __device__ T blockScanInclusive(T data, volatile T* smem, uint tid) in blockScanInclusive()
97 __device__ __forceinline__ T blockScanExclusive(T data, volatile T* smem, uint tid) in blockScanExclusive()
Dreduce.hpp63 __device__ __forceinline__ void blockReduce(volatile T* smem, T& val, uint tid, const Op& op) in blockReduce()
72 …evice__ __forceinline__ void blockReduce(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in blockReduce()
/external/opencv3/modules/cudev/include/opencv2/cudev/warp/
Dscan.hpp59 __device__ T warpScanInclusive(T data, volatile T* smem, uint tid) in warpScanInclusive()
95 __device__ __forceinline__ T warpScanExclusive(T data, volatile T* smem, uint tid) in warpScanExclusive()
Dreduce.hpp62 __device__ __forceinline__ void warpReduce(volatile T* smem, T& val, uint tid, const Op& op) in warpReduce()
70 …device__ __forceinline__ void warpReduce(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in warpReduce()
/external/opencv3/modules/core/include/opencv2/core/cuda/detail/
Dreduce.hpp76 thrust::get<I>(smem)[tid] = thrust::get<I>(val); in loadToSmem() local
92 … thrust::get<I>(smem)[tid] = thrust::get<I>(val) = thrust::get<I>(op)(thrust::get<I>(val), reg); in merge() local
128 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& val, unsigned int tid) in loadToSmem()
133 __device__ __forceinline__ void loadFromSmem(volatile T* smem, T& val, unsigned int tid) in loadFromSmem()
139 … __forceinline__ void loadToSmem(const thrust::tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in loadToSmem()
147 …_forceinline__ void loadFromSmem(const thrust::tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in loadFromSmem()
155 …__device__ __forceinline__ void merge(volatile T* smem, T& val, unsigned int tid, unsigned int del… in merge()
169 …ice__ __forceinline__ void merge(const thrust::tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in merge()
Dreduce_key_val.hpp76 thrust::get<I>(smem)[tid] = thrust::get<I>(data); in loadToSmem() local
171 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& data, unsigned int tid) in loadToSmem()
176 __device__ __forceinline__ void loadFromSmem(volatile T* smem, T& data, unsigned int tid) in loadFromSmem()
182 …line__ void loadToSmem(const thrust::tuple<VP0, VP1, VP2, VP3, VP4, VP5, VP6, VP7, VP8, VP9>& smem, in loadToSmem()
190 …ne__ void loadFromSmem(const thrust::tuple<VP0, VP1, VP2, VP3, VP4, VP5, VP6, VP7, VP8, VP9>& smem, in loadFromSmem()
/external/opencv3/modules/cudev/include/opencv2/cudev/warp/detail/
Dreduce.hpp83 get<I>(smem)[tid] = get<I>(val); in loadToSmem() local
92 get<I>(smem)[tid] = get<I>(val) = get<I>(op)(get<I>(val), reg); in merge() local
132 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& val, uint tid) in loadToSmem()
139 …device__ __forceinline__ void loadToSmem(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in loadToSmem()
149 …__device__ __forceinline__ void merge(volatile T* smem, T& val, uint tid, uint delta, const Op& op) in merge()
158 __device__ __forceinline__ void merge(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem, in merge()
Dreduce_key_val.hpp82 get<I>(smem)[tid] = get<I>(data); in loadToSmem() local
137 __device__ __forceinline__ void loadToSmem(volatile T* smem, T& data, uint tid) in loadToSmem()
144 …_forceinline__ void loadToSmem(const tuple<VP0, VP1, VP2, VP3, VP4, VP5, VP6, VP7, VP8, VP9>& smem, in loadToSmem()
/external/opencv3/modules/cudev/include/opencv2/cudev/grid/detail/
Dreduce.hpp71 __device__ __forceinline__ static volatile R* smem(R* ptr) in smem() function
92 __device__ __forceinline__ static tuple<volatile R*, volatile R*> smem(R* ptr) in smem() function
113 __device__ __forceinline__ static tuple<volatile R*, volatile R*, volatile R*> smem(R* ptr) in smem() function
136 …ice__ __forceinline__ static tuple<volatile R*, volatile R*, volatile R*, volatile R*> smem(R* ptr) in smem() function
279 __shared__ work_elem_type smem[BLOCK_SIZE * cn]; in reduceGrid() local
339 __shared__ work_type smem[BLOCK_SIZE]; in reduceGrid() local
Dhistogram.hpp60 __shared__ ResType smem[BIN_COUNT]; in histogram() local
Dreduce_to_row.hpp62 __shared__ work_type smem[BLOCK_SIZE_X * BLOCK_SIZE_Y]; in reduceToRow() local
Dintegral.hpp63 __shared__ D smem[NUM_SCAN_THREADS * 2]; in horizontal_pass() local
105 __shared__ D smem[NUM_SCAN_THREADS * 2]; in horizontal_pass() local
Dpyr_down.hpp68 __shared__ work_type smem[256 + 4]; in pyrDown() local
Dreduce_to_column.hpp102 __shared__ work_elem_type smem[cn][BLOCK_SIZE]; in reduceToColumn() local
/external/opencv3/modules/cudaoptflow/src/cuda/
Dfarneback.cu140 int smem = 3 * block.x * sizeof(float); in polynomialExpansionGpu() local
422 int smem = (block.x + 2*ksizeHalf) * 5 * block.y * sizeof(float); in boxFilter5Gpu() local
441 int smem = (block.x + 2*ksizeHalf) * 5 * block.y * sizeof(float); in boxFilter5Gpu_CC11() local
509 int smem = (block.x + 2*ksizeHalf) * block.y * sizeof(float); in gaussianBlurCaller() local
607 int smem = (block.x + 2*ksizeHalf) * 5 * block.y * sizeof(float); in gaussianBlur5Caller() local
/external/opencv3/modules/cudawarping/src/cuda/
Dpyr_down.cu59 __shared__ work_t smem[256 + 4]; in pyrDown() local
/external/opencv3/modules/cudafilters/src/cuda/
Dcolumn_filter.hpp74 __shared__ sum_t smem[(PATCH_PER_BLOCK + 2 * HALO_SIZE) * BLOCK_DIM_Y][BLOCK_DIM_X]; in linearColumnFilter() local
Drow_filter.hpp74 __shared__ sum_t smem[BLOCK_DIM_Y][(PATCH_PER_BLOCK + 2 * HALO_SIZE) * BLOCK_DIM_X]; in linearRowFilter() local
/external/opencv3/modules/cudalegacy/src/cuda/
Dneedle_map.cu56 __shared__ float smem[2 * NEEDLE_MAP_SCALE]; in NeedleMapAverageKernel() local
/external/opencv3/modules/cudaimgproc/src/cuda/
Dclahe.cu61 __shared__ int smem[512]; in calcLutKernel() local

12