Home
last modified time | relevance | path

Searched refs:KernelDescriptor (Results 1 – 10 of 10) sorted by relevance

/aosp_15_r20/external/pytorch/aten/src/ATen/native/cuda/
H A Djit_utils.h21 struct KernelDescriptor { struct
41 KernelDescriptor make_kernel_descriptor( in make_kernel_descriptor() argument
46 KernelDescriptor ret; in make_kernel_descriptor()
68 inline int can_vectorize_up_to(const KernelDescriptor &desc, c10::ArrayRef<char*> pointers) { in can_vectorize_up_to()
102 const KernelDescriptor &desc,
124 const KernelDescriptor &desc,
H A DCUDAJitLoops.cuh79 const at::cuda::jit::KernelDescriptor &desc, in launch_jitted_unrolled_kernel()
114 const at::cuda::jit::KernelDescriptor &desc, int64_t N, array_t data, in launch_jitted_vectorized_kernel()
179 const at::cuda::jit::KernelDescriptor &desc, in jitted_gpu_kernel_generic()
H A Djit_utils.cpp937 const KernelDescriptor &desc, in generate_code()
1305 const KernelDescriptor &desc, in generate_reduction_code()
H A DReduce.cuh905 const at::cuda::jit::KernelDescriptor &desc, in launch_jitted_reduce_kernel()
/aosp_15_r20/external/swiftshader/third_party/llvm-16.0/llvm/lib/Target/AMDGPU/MCTargetDesc/
H A DAMDGPUTargetStreamer.cpp852 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument
870 MCConstantExpr::create(sizeof(KernelDescriptor), Context)); in EmitAmdhsaKernelDescriptor()
878 Streamer.emitInt32(KernelDescriptor.group_segment_fixed_size); in EmitAmdhsaKernelDescriptor()
879 Streamer.emitInt32(KernelDescriptor.private_segment_fixed_size); in EmitAmdhsaKernelDescriptor()
880 Streamer.emitInt32(KernelDescriptor.kernarg_size); in EmitAmdhsaKernelDescriptor()
882 for (uint8_t Res : KernelDescriptor.reserved0) in EmitAmdhsaKernelDescriptor()
895 sizeof(KernelDescriptor.kernel_code_entry_byte_offset)); in EmitAmdhsaKernelDescriptor()
896 for (uint8_t Res : KernelDescriptor.reserved1) in EmitAmdhsaKernelDescriptor()
898 Streamer.emitInt32(KernelDescriptor.compute_pgm_rsrc3); in EmitAmdhsaKernelDescriptor()
899 Streamer.emitInt32(KernelDescriptor.compute_pgm_rsrc1); in EmitAmdhsaKernelDescriptor()
[all …]
H A DAMDGPUTargetStreamer.h95 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument
155 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
215 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
/aosp_15_r20/external/swiftshader/third_party/llvm-10.0/llvm/lib/Target/AMDGPU/MCTargetDesc/
H A DAMDGPUTargetStreamer.cpp614 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR, in EmitAmdhsaKernelDescriptor() argument
633 MCConstantExpr::create(sizeof(KernelDescriptor), Context)); in EmitAmdhsaKernelDescriptor()
642 (const char*)&(KernelDescriptor), in EmitAmdhsaKernelDescriptor()
654 sizeof(KernelDescriptor.kernel_code_entry_byte_offset)); in EmitAmdhsaKernelDescriptor()
656 (const char*)&(KernelDescriptor) + in EmitAmdhsaKernelDescriptor()
658 sizeof(KernelDescriptor.kernel_code_entry_byte_offset), in EmitAmdhsaKernelDescriptor()
659 sizeof(KernelDescriptor) - in EmitAmdhsaKernelDescriptor()
661 sizeof(KernelDescriptor.kernel_code_entry_byte_offset))); in EmitAmdhsaKernelDescriptor()
H A DAMDGPUTargetStreamer.h85 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
129 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
176 const amdhsa::kernel_descriptor_t &KernelDescriptor, uint64_t NextVGPR,
/aosp_15_r20/external/swiftshader/third_party/llvm-16.0/llvm/lib/Target/AMDGPU/
H A DAMDGPUAsmPrinter.cpp427 amdhsa::kernel_descriptor_t KernelDescriptor; in getAmdhsaKernelDescriptor() local
428 memset(&KernelDescriptor, 0x0, sizeof(KernelDescriptor)); in getAmdhsaKernelDescriptor()
434 KernelDescriptor.group_segment_fixed_size = PI.LDSSize; in getAmdhsaKernelDescriptor()
435 KernelDescriptor.private_segment_fixed_size = PI.ScratchSize; in getAmdhsaKernelDescriptor()
438 KernelDescriptor.kernarg_size = STM.getKernArgSegmentSize(F, MaxKernArgAlign); in getAmdhsaKernelDescriptor()
440 KernelDescriptor.compute_pgm_rsrc1 = PI.getComputePGMRSrc1(); in getAmdhsaKernelDescriptor()
441 KernelDescriptor.compute_pgm_rsrc2 = PI.ComputePGMRSrc2; in getAmdhsaKernelDescriptor()
442 KernelDescriptor.kernel_code_properties = getAmdhsaKernelCodeProperties(MF); in getAmdhsaKernelDescriptor()
446 KernelDescriptor.compute_pgm_rsrc3 = in getAmdhsaKernelDescriptor()
449 return KernelDescriptor; in getAmdhsaKernelDescriptor()
/aosp_15_r20/external/swiftshader/third_party/llvm-10.0/llvm/lib/Target/AMDGPU/
H A DAMDGPUAsmPrinter.cpp403 amdhsa::kernel_descriptor_t KernelDescriptor; in getAmdhsaKernelDescriptor() local
404 memset(&KernelDescriptor, 0x0, sizeof(KernelDescriptor)); in getAmdhsaKernelDescriptor()
410 KernelDescriptor.group_segment_fixed_size = PI.LDSSize; in getAmdhsaKernelDescriptor()
411 KernelDescriptor.private_segment_fixed_size = PI.ScratchSize; in getAmdhsaKernelDescriptor()
412 KernelDescriptor.compute_pgm_rsrc1 = PI.ComputePGMRSrc1; in getAmdhsaKernelDescriptor()
413 KernelDescriptor.compute_pgm_rsrc2 = PI.ComputePGMRSrc2; in getAmdhsaKernelDescriptor()
414 KernelDescriptor.kernel_code_properties = getAmdhsaKernelCodeProperties(MF); in getAmdhsaKernelDescriptor()
416 return KernelDescriptor; in getAmdhsaKernelDescriptor()