Searched refs:src_lane (Results 1 - 6 of 6) sorted by relevance
/external/tensorflow/tensorflow/core/util/ |
H A D | cuda_device_functions.h | 122 // defined value, assuming the calling lane will read from src_lane as part of 125 // Specifically, returns true iff mask has the calling lane bit and the src_lane 126 // bit set, and the src_lane calls this function with the same mask value 133 unsigned src_lane) { 134 unsigned src_dst_mask = 1u << CudaLaneId() | 1u << src_lane; 136 unsigned src_lane_mask = __shfl_sync(mask, mask, src_lane); 138 unsigned src_lane_mask = __shfl(mask, src_lane); 144 __device__ inline unsigned CudaShuffleGetSrcLane(int src_lane, int width) { 147 int lane_offset = src_lane & width - 1; 173 int src_lane [all...] |
H A D | cuda_kernel_helper_test.cu.cc | 101 for (int src_lane = -warpSize; src_lane <= warpSize; ++src_lane) { 102 unsigned actual_lane = detail::CudaShuffleGetSrcLane(src_lane, width); 104 CudaShuffleSync(kCudaWarpAll, lane_id, src_lane, width); 105 check_result("Shuffle", src_lane, actual_lane, expect_lane);
|
H A D | cuda_kernel_helper.h | 69 int src_lane, 72 CudaShuffleSync(mask, static_cast<uint16>(value), src_lane, width)); 68 CudaShuffleSync(unsigned mask, Eigen::half value, int src_lane, int width = warpSize) argument
|
/external/v8/src/arm/ |
H A D | macro-assembler-arm.h | 567 void ReplaceLane(QwNeonRegister dst, QwNeonRegister src, Register src_lane, 570 SwVfpRegister src_lane, Register scratch, int lane);
|
H A D | macro-assembler-arm.cc | 1166 Register src_lane, NeonDataType dt, int lane) { 1175 vmov(dt, double_dst, double_lane, src_lane); 1179 SwVfpRegister src_lane, Register scratch, 1183 VmovExtended(s_code, src_lane.code(), scratch);
|
/external/vixl/src/aarch64/ |
H A D | logic-aarch64.cc | 1720 uint64_t src_lane = src.Uint(vform, i); local 1722 uint64_t shifted = src_lane << shift; 1772 uint64_t src_lane = src.Uint(vform, i); local 1780 shifted = src_lane >> shift;
|
Completed in 406 milliseconds