Searched refs:KernelDescriptor (Results 1 – 10 of 10) sorted by relevance
/aosp_15_r20/external/pytorch/aten/src/ATen/native/cuda/ |
H A D | jit_utils.h | 21 struct KernelDescriptor { struct 41 KernelDescriptor make_kernel_descriptor( in make_kernel_descriptor() argument 46 KernelDescriptor ret; in make_kernel_descriptor() 68 inline int can_vectorize_up_to(const KernelDescriptor &desc, c10::ArrayRef<char*> pointers) { in can_vectorize_up_to() 102 const KernelDescriptor &desc, 124 const KernelDescriptor &desc,
|
H A D | CUDAJitLoops.cuh | 79 const at::cuda::jit::KernelDescriptor &desc, in launch_jitted_unrolled_kernel() 114 const at::cuda::jit::KernelDescriptor &desc, int64_t N, array_t data, in launch_jitted_vectorized_kernel() 179 const at::cuda::jit::KernelDescriptor &desc, in jitted_gpu_kernel_generic()
|
H A D | jit_utils.cpp | 937 const KernelDescriptor &desc, in generate_code() 1305 const KernelDescriptor &desc, in generate_reduction_code()
|
H A D | Reduce.cuh | 905 const at::cuda::jit::KernelDescriptor &desc, in launch_jitted_reduce_kernel()
|
/aosp_15_r20/external/swiftshader/third_party/llvm-16.0/llvm/lib/Target/AMDGPU/MCTargetDesc/ |
H A D | AMDGPUTargetStreamer.cpp | 852 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument 870 MCConstantExpr::create(sizeof(KernelDescriptor), Context)); in EmitAmdhsaKernelDescriptor() 878 Streamer.emitInt32(KernelDescriptor.group_segment_fixed_size); in EmitAmdhsaKernelDescriptor() 879 Streamer.emitInt32(KernelDescriptor.private_segment_fixed_size); in EmitAmdhsaKernelDescriptor() 880 Streamer.emitInt32(KernelDescriptor.kernarg_size); in EmitAmdhsaKernelDescriptor() 882 for (uint8_t Res : KernelDescriptor.reserved0) in EmitAmdhsaKernelDescriptor() 895 sizeof(KernelDescriptor.kernel_code_entry_byte_offset)); in EmitAmdhsaKernelDescriptor() 896 for (uint8_t Res : KernelDescriptor.reserved1) in EmitAmdhsaKernelDescriptor() 898 Streamer.emitInt32(KernelDescriptor.compute_pgm_rsrc3); in EmitAmdhsaKernelDescriptor() 899 Streamer.emitInt32(KernelDescriptor.compute_pgm_rsrc1); in EmitAmdhsaKernelDescriptor() [all …]
|
H A D | AMDGPUTargetStreamer.h | 95 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument 155 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, 215 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
|
/aosp_15_r20/external/swiftshader/third_party/llvm-10.0/llvm/lib/Target/AMDGPU/MCTargetDesc/ |
H A D | AMDGPUTargetStreamer.cpp | 614 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument 633 MCConstantExpr::create(sizeof(KernelDescriptor), Context)); in EmitAmdhsaKernelDescriptor() 642 (const char*)&(KernelDescriptor), in EmitAmdhsaKernelDescriptor() 654 sizeof(KernelDescriptor.kernel_code_entry_byte_offset)); in EmitAmdhsaKernelDescriptor() 656 (const char*)&(KernelDescriptor) + in EmitAmdhsaKernelDescriptor() 658 sizeof(KernelDescriptor.kernel_code_entry_byte_offset), in EmitAmdhsaKernelDescriptor() 659 sizeof(KernelDescriptor) - in EmitAmdhsaKernelDescriptor() 661 sizeof(KernelDescriptor.kernel_code_entry_byte_offset))); in EmitAmdhsaKernelDescriptor()
|
H A D | AMDGPUTargetStreamer.h | 85 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, 129 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, 176 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
|
/aosp_15_r20/external/swiftshader/third_party/llvm-16.0/llvm/lib/Target/AMDGPU/ |
H A D | AMDGPUAsmPrinter.cpp | 427 amdhsa::kernel_descriptor_t KernelDescriptor; in getAmdhsaKernelDescriptor() local 428 memset(&KernelDescriptor, 0x0, sizeof(KernelDescriptor)); in getAmdhsaKernelDescriptor() 434 KernelDescriptor.group_segment_fixed_size = PI.LDSSize; in getAmdhsaKernelDescriptor() 435 KernelDescriptor.private_segment_fixed_size = PI.ScratchSize; in getAmdhsaKernelDescriptor() 438 KernelDescriptor.kernarg_size = STM.getKernArgSegmentSize(F, MaxKernArgAlign); in getAmdhsaKernelDescriptor() 440 KernelDescriptor.compute_pgm_rsrc1 = PI.getComputePGMRSrc1(); in getAmdhsaKernelDescriptor() 441 KernelDescriptor.compute_pgm_rsrc2 = PI.ComputePGMRSrc2; in getAmdhsaKernelDescriptor() 442 KernelDescriptor.kernel_code_properties = getAmdhsaKernelCodeProperties(MF); in getAmdhsaKernelDescriptor() 446 KernelDescriptor.compute_pgm_rsrc3 = in getAmdhsaKernelDescriptor() 449 return KernelDescriptor; in getAmdhsaKernelDescriptor()
|
/aosp_15_r20/external/swiftshader/third_party/llvm-10.0/llvm/lib/Target/AMDGPU/ |
H A D | AMDGPUAsmPrinter.cpp | 403 amdhsa::kernel_descriptor_t KernelDescriptor; in getAmdhsaKernelDescriptor() local 404 memset(&KernelDescriptor, 0x0, sizeof(KernelDescriptor)); in getAmdhsaKernelDescriptor() 410 KernelDescriptor.group_segment_fixed_size = PI.LDSSize; in getAmdhsaKernelDescriptor() 411 KernelDescriptor.private_segment_fixed_size = PI.ScratchSize; in getAmdhsaKernelDescriptor() 412 KernelDescriptor.compute_pgm_rsrc1 = PI.ComputePGMRSrc1; in getAmdhsaKernelDescriptor() 413 KernelDescriptor.compute_pgm_rsrc2 = PI.ComputePGMRSrc2; in getAmdhsaKernelDescriptor() 414 KernelDescriptor.kernel_code_properties = getAmdhsaKernelCodeProperties(MF); in getAmdhsaKernelDescriptor() 416 return KernelDescriptor; in getAmdhsaKernelDescriptor()
|