Home
last modified time | relevance | path

Searched refs:kNumWarps (Results 1 – 8 of 8) sorted by relevance

/dports/math/faiss/faiss-1.7.1/faiss/gpu/utils/
H A DBlockSelectKernel.cuh29 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in blockSelect() local
31 __shared__ K smemK[kNumWarps * NumWarpQ]; in blockSelect()
32 __shared__ IndexType smemV[kNumWarps * NumWarpQ]; in blockSelect()
86 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in blockSelectPair() local
88 __shared__ K smemK[kNumWarps * NumWarpQ]; in blockSelectPair()
89 __shared__ IndexType smemV[kNumWarps * NumWarpQ]; in blockSelectPair()
H A DWarpSelectKernel.cuh29 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in warpSelect() local
42 int row = blockIdx.x * kNumWarps + warpId; in warpSelect()
H A DSelect.cuh148 static constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; member
302 FinalBlockMerge<kNumWarps, ThreadsPerBlock, K, V, NumWarpQ, Dir, Comp>:: in reduce()
346 static constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; member
397 for (int i = 1; i < kNumWarps; ++i) { in reduce()
597 static constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; member
/dports/math/faiss/faiss-1.7.1/faiss/gpu/impl/
H A DIVFUtilsSelect1.cu32 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in pass1SelectLists() local
34 __shared__ float smemK[kNumWarps * NumWarpQ]; in pass1SelectLists()
35 __shared__ int smemV[kNumWarps * NumWarpQ]; in pass1SelectLists()
H A DIVFUtilsSelect2.cu63 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in pass2SelectLists() local
65 __shared__ float smemK[kNumWarps * NumWarpQ]; in pass2SelectLists()
66 __shared__ int smemV[kNumWarps * NumWarpQ]; in pass2SelectLists()
H A DIVFInterleaved.cu31 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in ivfInterleavedScan2() local
33 __shared__ float smemK[kNumWarps * NumWarpQ]; in ivfInterleavedScan2()
34 __shared__ uint32_t smemV[kNumWarps * NumWarpQ]; in ivfInterleavedScan2()
H A DL2Select.cu137 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in l2SelectMinK() local
139 __shared__ T smemK[kNumWarps * NumWarpQ]; in l2SelectMinK()
140 __shared__ int smemV[kNumWarps * NumWarpQ]; in l2SelectMinK()
H A DIVFInterleaved.cuh54 constexpr int kNumWarps = ThreadsPerBlock / kWarpSize; in ivfInterleavedScan() local
81 __shared__ float smemK[kNumWarps * NumWarpQ]; in ivfInterleavedScan()
82 __shared__ int smemV[kNumWarps * NumWarpQ]; in ivfInterleavedScan()
110 for (int block = warpId; block < numBlocks; block += kNumWarps) { in ivfInterleavedScan()