| .. | .. |
|---|
| 33 | 33 | #include <linux/time.h> |
|---|
| 34 | 34 | #include <linux/mm.h> |
|---|
| 35 | 35 | #include <linux/mman.h> |
|---|
| 36 | +#include <linux/dma-buf.h> |
|---|
| 36 | 37 | #include <asm/processor.h> |
|---|
| 37 | 38 | #include "kfd_priv.h" |
|---|
| 38 | 39 | #include "kfd_device_queue_manager.h" |
|---|
| 39 | 40 | #include "kfd_dbgmgr.h" |
|---|
| 41 | +#include "amdgpu_amdkfd.h" |
|---|
| 42 | +#include "kfd_smi_events.h" |
|---|
| 40 | 43 | |
|---|
| 41 | 44 | static long kfd_ioctl(struct file *, unsigned int, unsigned long); |
|---|
| 42 | 45 | static int kfd_open(struct inode *, struct file *); |
|---|
| 46 | +static int kfd_release(struct inode *, struct file *); |
|---|
| 43 | 47 | static int kfd_mmap(struct file *, struct vm_area_struct *); |
|---|
| 44 | 48 | |
|---|
| 45 | 49 | static const char kfd_dev_name[] = "kfd"; |
|---|
| .. | .. |
|---|
| 47 | 51 | static const struct file_operations kfd_fops = { |
|---|
| 48 | 52 | .owner = THIS_MODULE, |
|---|
| 49 | 53 | .unlocked_ioctl = kfd_ioctl, |
|---|
| 50 | | - .compat_ioctl = kfd_ioctl, |
|---|
| 54 | + .compat_ioctl = compat_ptr_ioctl, |
|---|
| 51 | 55 | .open = kfd_open, |
|---|
| 56 | + .release = kfd_release, |
|---|
| 52 | 57 | .mmap = kfd_mmap, |
|---|
| 53 | 58 | }; |
|---|
| 54 | 59 | |
|---|
| .. | .. |
|---|
| 92 | 97 | device_destroy(kfd_class, MKDEV(kfd_char_dev_major, 0)); |
|---|
| 93 | 98 | class_destroy(kfd_class); |
|---|
| 94 | 99 | unregister_chrdev(kfd_char_dev_major, kfd_dev_name); |
|---|
| 100 | + kfd_device = NULL; |
|---|
| 95 | 101 | } |
|---|
| 96 | 102 | |
|---|
| 97 | 103 | struct device *kfd_chardev(void) |
|---|
| .. | .. |
|---|
| 122 | 128 | if (IS_ERR(process)) |
|---|
| 123 | 129 | return PTR_ERR(process); |
|---|
| 124 | 130 | |
|---|
| 125 | | - if (kfd_is_locked()) |
|---|
| 131 | + if (kfd_is_locked()) { |
|---|
| 132 | + dev_dbg(kfd_device, "kfd is locked!\n" |
|---|
| 133 | + "process %d unreferenced", process->pasid); |
|---|
| 134 | + kfd_unref_process(process); |
|---|
| 126 | 135 | return -EAGAIN; |
|---|
| 136 | + } |
|---|
| 137 | + |
|---|
| 138 | + /* filep now owns the reference returned by kfd_create_process */ |
|---|
| 139 | + filep->private_data = process; |
|---|
| 127 | 140 | |
|---|
| 128 | 141 | dev_dbg(kfd_device, "process %d opened, compat mode (32 bit) - %d\n", |
|---|
| 129 | 142 | process->pasid, process->is_32bit_user_mode); |
|---|
| 143 | + |
|---|
| 144 | + return 0; |
|---|
| 145 | +} |
|---|
| 146 | + |
|---|
| 147 | +static int kfd_release(struct inode *inode, struct file *filep) |
|---|
| 148 | +{ |
|---|
| 149 | + struct kfd_process *process = filep->private_data; |
|---|
| 150 | + |
|---|
| 151 | + if (process) |
|---|
| 152 | + kfd_unref_process(process); |
|---|
| 130 | 153 | |
|---|
| 131 | 154 | return 0; |
|---|
| 132 | 155 | } |
|---|
| .. | .. |
|---|
| 156 | 179 | } |
|---|
| 157 | 180 | |
|---|
| 158 | 181 | if ((args->ring_base_address) && |
|---|
| 159 | | - (!access_ok(VERIFY_WRITE, |
|---|
| 160 | | - (const void __user *) args->ring_base_address, |
|---|
| 182 | + (!access_ok((const void __user *) args->ring_base_address, |
|---|
| 161 | 183 | sizeof(uint64_t)))) { |
|---|
| 162 | 184 | pr_err("Can't access ring base address\n"); |
|---|
| 163 | 185 | return -EFAULT; |
|---|
| .. | .. |
|---|
| 168 | 190 | return -EINVAL; |
|---|
| 169 | 191 | } |
|---|
| 170 | 192 | |
|---|
| 171 | | - if (!access_ok(VERIFY_WRITE, |
|---|
| 172 | | - (const void __user *) args->read_pointer_address, |
|---|
| 193 | + if (!access_ok((const void __user *) args->read_pointer_address, |
|---|
| 173 | 194 | sizeof(uint32_t))) { |
|---|
| 174 | 195 | pr_err("Can't access read pointer\n"); |
|---|
| 175 | 196 | return -EFAULT; |
|---|
| 176 | 197 | } |
|---|
| 177 | 198 | |
|---|
| 178 | | - if (!access_ok(VERIFY_WRITE, |
|---|
| 179 | | - (const void __user *) args->write_pointer_address, |
|---|
| 199 | + if (!access_ok((const void __user *) args->write_pointer_address, |
|---|
| 180 | 200 | sizeof(uint32_t))) { |
|---|
| 181 | 201 | pr_err("Can't access write pointer\n"); |
|---|
| 182 | 202 | return -EFAULT; |
|---|
| 183 | 203 | } |
|---|
| 184 | 204 | |
|---|
| 185 | 205 | if (args->eop_buffer_address && |
|---|
| 186 | | - !access_ok(VERIFY_WRITE, |
|---|
| 187 | | - (const void __user *) args->eop_buffer_address, |
|---|
| 206 | + !access_ok((const void __user *) args->eop_buffer_address, |
|---|
| 188 | 207 | sizeof(uint32_t))) { |
|---|
| 189 | 208 | pr_debug("Can't access eop buffer"); |
|---|
| 190 | 209 | return -EFAULT; |
|---|
| 191 | 210 | } |
|---|
| 192 | 211 | |
|---|
| 193 | 212 | if (args->ctx_save_restore_address && |
|---|
| 194 | | - !access_ok(VERIFY_WRITE, |
|---|
| 195 | | - (const void __user *) args->ctx_save_restore_address, |
|---|
| 213 | + !access_ok((const void __user *) args->ctx_save_restore_address, |
|---|
| 196 | 214 | sizeof(uint32_t))) { |
|---|
| 197 | 215 | pr_debug("Can't access ctx save restore buffer"); |
|---|
| 198 | 216 | return -EFAULT; |
|---|
| 199 | 217 | } |
|---|
| 200 | 218 | |
|---|
| 201 | 219 | q_properties->is_interop = false; |
|---|
| 220 | + q_properties->is_gws = false; |
|---|
| 202 | 221 | q_properties->queue_percent = args->queue_percentage; |
|---|
| 203 | 222 | q_properties->priority = args->queue_priority; |
|---|
| 204 | 223 | q_properties->queue_address = args->ring_base_address; |
|---|
| .. | .. |
|---|
| 216 | 235 | q_properties->type = KFD_QUEUE_TYPE_COMPUTE; |
|---|
| 217 | 236 | else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA) |
|---|
| 218 | 237 | q_properties->type = KFD_QUEUE_TYPE_SDMA; |
|---|
| 238 | + else if (args->queue_type == KFD_IOC_QUEUE_TYPE_SDMA_XGMI) |
|---|
| 239 | + q_properties->type = KFD_QUEUE_TYPE_SDMA_XGMI; |
|---|
| 219 | 240 | else |
|---|
| 220 | 241 | return -ENOTSUPP; |
|---|
| 221 | 242 | |
|---|
| .. | .. |
|---|
| 259 | 280 | unsigned int queue_id; |
|---|
| 260 | 281 | struct kfd_process_device *pdd; |
|---|
| 261 | 282 | struct queue_properties q_properties; |
|---|
| 283 | + uint32_t doorbell_offset_in_process = 0; |
|---|
| 262 | 284 | |
|---|
| 263 | 285 | memset(&q_properties, 0, sizeof(struct queue_properties)); |
|---|
| 264 | 286 | |
|---|
| .. | .. |
|---|
| 283 | 305 | goto err_bind_process; |
|---|
| 284 | 306 | } |
|---|
| 285 | 307 | |
|---|
| 286 | | - pr_debug("Creating queue for PASID %d on gpu 0x%x\n", |
|---|
| 308 | + pr_debug("Creating queue for PASID 0x%x on gpu 0x%x\n", |
|---|
| 287 | 309 | p->pasid, |
|---|
| 288 | 310 | dev->id); |
|---|
| 289 | 311 | |
|---|
| 290 | | - err = pqm_create_queue(&p->pqm, dev, filep, &q_properties, &queue_id); |
|---|
| 312 | + err = pqm_create_queue(&p->pqm, dev, filep, &q_properties, &queue_id, |
|---|
| 313 | + &doorbell_offset_in_process); |
|---|
| 291 | 314 | if (err != 0) |
|---|
| 292 | 315 | goto err_create_queue; |
|---|
| 293 | 316 | |
|---|
| .. | .. |
|---|
| 297 | 320 | /* Return gpu_id as doorbell offset for mmap usage */ |
|---|
| 298 | 321 | args->doorbell_offset = KFD_MMAP_TYPE_DOORBELL; |
|---|
| 299 | 322 | args->doorbell_offset |= KFD_MMAP_GPU_ID(args->gpu_id); |
|---|
| 300 | | - args->doorbell_offset <<= PAGE_SHIFT; |
|---|
| 301 | 323 | if (KFD_IS_SOC15(dev->device_info->asic_family)) |
|---|
| 302 | | - /* On SOC15 ASICs, doorbell allocation must be |
|---|
| 303 | | - * per-device, and independent from the per-process |
|---|
| 304 | | - * queue_id. Return the doorbell offset within the |
|---|
| 305 | | - * doorbell aperture to user mode. |
|---|
| 324 | + /* On SOC15 ASICs, include the doorbell offset within the |
|---|
| 325 | + * process doorbell frame, which is 2 pages. |
|---|
| 306 | 326 | */ |
|---|
| 307 | | - args->doorbell_offset |= q_properties.doorbell_off; |
|---|
| 327 | + args->doorbell_offset |= doorbell_offset_in_process; |
|---|
| 308 | 328 | |
|---|
| 309 | 329 | mutex_unlock(&p->mutex); |
|---|
| 310 | 330 | |
|---|
| .. | .. |
|---|
| 333 | 353 | int retval; |
|---|
| 334 | 354 | struct kfd_ioctl_destroy_queue_args *args = data; |
|---|
| 335 | 355 | |
|---|
| 336 | | - pr_debug("Destroying queue id %d for pasid %d\n", |
|---|
| 356 | + pr_debug("Destroying queue id %d for pasid 0x%x\n", |
|---|
| 337 | 357 | args->queue_id, |
|---|
| 338 | 358 | p->pasid); |
|---|
| 339 | 359 | |
|---|
| .. | .. |
|---|
| 363 | 383 | } |
|---|
| 364 | 384 | |
|---|
| 365 | 385 | if ((args->ring_base_address) && |
|---|
| 366 | | - (!access_ok(VERIFY_WRITE, |
|---|
| 367 | | - (const void __user *) args->ring_base_address, |
|---|
| 386 | + (!access_ok((const void __user *) args->ring_base_address, |
|---|
| 368 | 387 | sizeof(uint64_t)))) { |
|---|
| 369 | 388 | pr_err("Can't access ring base address\n"); |
|---|
| 370 | 389 | return -EFAULT; |
|---|
| .. | .. |
|---|
| 380 | 399 | properties.queue_percent = args->queue_percentage; |
|---|
| 381 | 400 | properties.priority = args->queue_priority; |
|---|
| 382 | 401 | |
|---|
| 383 | | - pr_debug("Updating queue id %d for pasid %d\n", |
|---|
| 402 | + pr_debug("Updating queue id %d for pasid 0x%x\n", |
|---|
| 384 | 403 | args->queue_id, p->pasid); |
|---|
| 385 | 404 | |
|---|
| 386 | 405 | mutex_lock(&p->mutex); |
|---|
| .. | .. |
|---|
| 447 | 466 | return retval; |
|---|
| 448 | 467 | } |
|---|
| 449 | 468 | |
|---|
| 469 | +static int kfd_ioctl_get_queue_wave_state(struct file *filep, |
|---|
| 470 | + struct kfd_process *p, void *data) |
|---|
| 471 | +{ |
|---|
| 472 | + struct kfd_ioctl_get_queue_wave_state_args *args = data; |
|---|
| 473 | + int r; |
|---|
| 474 | + |
|---|
| 475 | + mutex_lock(&p->mutex); |
|---|
| 476 | + |
|---|
| 477 | + r = pqm_get_wave_state(&p->pqm, args->queue_id, |
|---|
| 478 | + (void __user *)args->ctl_stack_address, |
|---|
| 479 | + &args->ctl_stack_used_size, |
|---|
| 480 | + &args->save_area_used_size); |
|---|
| 481 | + |
|---|
| 482 | + mutex_unlock(&p->mutex); |
|---|
| 483 | + |
|---|
| 484 | + return r; |
|---|
| 485 | +} |
|---|
| 486 | + |
|---|
| 450 | 487 | static int kfd_ioctl_set_memory_policy(struct file *filep, |
|---|
| 451 | 488 | struct kfd_process *p, void *data) |
|---|
| 452 | 489 | { |
|---|
| .. | .. |
|---|
| 508 | 545 | struct kfd_process_device *pdd; |
|---|
| 509 | 546 | |
|---|
| 510 | 547 | dev = kfd_device_by_id(args->gpu_id); |
|---|
| 511 | | - if (dev == NULL) |
|---|
| 548 | + if (!dev) |
|---|
| 512 | 549 | return -EINVAL; |
|---|
| 513 | 550 | |
|---|
| 514 | 551 | mutex_lock(&p->mutex); |
|---|
| .. | .. |
|---|
| 816 | 853 | dev = kfd_device_by_id(args->gpu_id); |
|---|
| 817 | 854 | if (dev) |
|---|
| 818 | 855 | /* Reading GPU clock counter from KGD */ |
|---|
| 819 | | - args->gpu_clock_counter = |
|---|
| 820 | | - dev->kfd2kgd->get_gpu_clock_counter(dev->kgd); |
|---|
| 856 | + args->gpu_clock_counter = amdgpu_amdkfd_get_gpu_clock_counter(dev->kgd); |
|---|
| 821 | 857 | else |
|---|
| 822 | 858 | /* Node without GPU resource */ |
|---|
| 823 | 859 | args->gpu_clock_counter = 0; |
|---|
| 824 | 860 | |
|---|
| 825 | 861 | /* No access to rdtsc. Using raw monotonic time */ |
|---|
| 826 | 862 | args->cpu_clock_counter = ktime_get_raw_ns(); |
|---|
| 827 | | - args->system_clock_counter = ktime_get_boot_ns(); |
|---|
| 863 | + args->system_clock_counter = ktime_get_boottime_ns(); |
|---|
| 828 | 864 | |
|---|
| 829 | 865 | /* Since the counter is in nano-seconds we use 1GHz frequency */ |
|---|
| 830 | 866 | args->system_clock_freq = 1000000000; |
|---|
| .. | .. |
|---|
| 840 | 876 | struct kfd_process_device_apertures *pAperture; |
|---|
| 841 | 877 | struct kfd_process_device *pdd; |
|---|
| 842 | 878 | |
|---|
| 843 | | - dev_dbg(kfd_device, "get apertures for PASID %d", p->pasid); |
|---|
| 879 | + dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid); |
|---|
| 844 | 880 | |
|---|
| 845 | 881 | args->num_of_nodes = 0; |
|---|
| 846 | 882 | |
|---|
| .. | .. |
|---|
| 898 | 934 | uint32_t nodes = 0; |
|---|
| 899 | 935 | int ret; |
|---|
| 900 | 936 | |
|---|
| 901 | | - dev_dbg(kfd_device, "get apertures for PASID %d", p->pasid); |
|---|
| 937 | + dev_dbg(kfd_device, "get apertures for PASID 0x%x", p->pasid); |
|---|
| 902 | 938 | |
|---|
| 903 | 939 | if (args->num_of_nodes == 0) { |
|---|
| 904 | 940 | /* Return number of nodes, so that user space can allocate |
|---|
| .. | .. |
|---|
| 1024 | 1060 | } |
|---|
| 1025 | 1061 | mutex_unlock(&p->mutex); |
|---|
| 1026 | 1062 | |
|---|
| 1027 | | - err = kfd->kfd2kgd->map_gtt_bo_to_kernel(kfd->kgd, |
|---|
| 1063 | + err = amdgpu_amdkfd_gpuvm_map_gtt_bo_to_kernel(kfd->kgd, |
|---|
| 1028 | 1064 | mem, &kern_addr, &size); |
|---|
| 1029 | 1065 | if (err) { |
|---|
| 1030 | 1066 | pr_err("Failed to map event page to kernel\n"); |
|---|
| .. | .. |
|---|
| 1113 | 1149 | mutex_unlock(&p->mutex); |
|---|
| 1114 | 1150 | |
|---|
| 1115 | 1151 | if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS && |
|---|
| 1116 | | - pdd->qpd.vmid != 0) |
|---|
| 1152 | + pdd->qpd.vmid != 0 && dev->kfd2kgd->set_scratch_backing_va) |
|---|
| 1117 | 1153 | dev->kfd2kgd->set_scratch_backing_va( |
|---|
| 1118 | 1154 | dev->kgd, args->va_addr, pdd->qpd.vmid); |
|---|
| 1119 | 1155 | |
|---|
| .. | .. |
|---|
| 1136 | 1172 | if (!dev) |
|---|
| 1137 | 1173 | return -EINVAL; |
|---|
| 1138 | 1174 | |
|---|
| 1139 | | - dev->kfd2kgd->get_tile_config(dev->kgd, &config); |
|---|
| 1175 | + amdgpu_amdkfd_get_tile_config(dev->kgd, &config); |
|---|
| 1140 | 1176 | |
|---|
| 1141 | 1177 | args->gb_addr_config = config.gb_addr_config; |
|---|
| 1142 | 1178 | args->num_banks = config.num_banks; |
|---|
| .. | .. |
|---|
| 1210 | 1246 | return ret; |
|---|
| 1211 | 1247 | } |
|---|
| 1212 | 1248 | |
|---|
| 1213 | | -static bool kfd_dev_is_large_bar(struct kfd_dev *dev) |
|---|
| 1249 | +bool kfd_dev_is_large_bar(struct kfd_dev *dev) |
|---|
| 1214 | 1250 | { |
|---|
| 1215 | 1251 | struct kfd_local_mem_info mem_info; |
|---|
| 1216 | 1252 | |
|---|
| .. | .. |
|---|
| 1219 | 1255 | return true; |
|---|
| 1220 | 1256 | } |
|---|
| 1221 | 1257 | |
|---|
| 1222 | | - if (dev->device_info->needs_iommu_device) |
|---|
| 1258 | + if (dev->use_iommu_v2) |
|---|
| 1223 | 1259 | return false; |
|---|
| 1224 | 1260 | |
|---|
| 1225 | | - dev->kfd2kgd->get_local_mem_info(dev->kgd, &mem_info); |
|---|
| 1261 | + amdgpu_amdkfd_get_local_mem_info(dev->kgd, &mem_info); |
|---|
| 1226 | 1262 | if (mem_info.local_mem_size_private == 0 && |
|---|
| 1227 | 1263 | mem_info.local_mem_size_public > 0) |
|---|
| 1228 | 1264 | return true; |
|---|
| .. | .. |
|---|
| 1263 | 1299 | goto err_unlock; |
|---|
| 1264 | 1300 | } |
|---|
| 1265 | 1301 | |
|---|
| 1266 | | - err = dev->kfd2kgd->alloc_memory_of_gpu( |
|---|
| 1302 | + if (flags & KFD_IOC_ALLOC_MEM_FLAGS_DOORBELL) { |
|---|
| 1303 | + if (args->size != kfd_doorbell_process_slice(dev)) { |
|---|
| 1304 | + err = -EINVAL; |
|---|
| 1305 | + goto err_unlock; |
|---|
| 1306 | + } |
|---|
| 1307 | + offset = kfd_get_process_doorbells(pdd); |
|---|
| 1308 | + } else if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP) { |
|---|
| 1309 | + if (args->size != PAGE_SIZE) { |
|---|
| 1310 | + err = -EINVAL; |
|---|
| 1311 | + goto err_unlock; |
|---|
| 1312 | + } |
|---|
| 1313 | + offset = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd); |
|---|
| 1314 | + if (!offset) { |
|---|
| 1315 | + err = -ENOMEM; |
|---|
| 1316 | + goto err_unlock; |
|---|
| 1317 | + } |
|---|
| 1318 | + } |
|---|
| 1319 | + |
|---|
| 1320 | + err = amdgpu_amdkfd_gpuvm_alloc_memory_of_gpu( |
|---|
| 1267 | 1321 | dev->kgd, args->va_addr, args->size, |
|---|
| 1268 | 1322 | pdd->vm, (struct kgd_mem **) &mem, &offset, |
|---|
| 1269 | 1323 | flags); |
|---|
| .. | .. |
|---|
| 1277 | 1331 | goto err_free; |
|---|
| 1278 | 1332 | } |
|---|
| 1279 | 1333 | |
|---|
| 1334 | + /* Update the VRAM usage count */ |
|---|
| 1335 | + if (flags & KFD_IOC_ALLOC_MEM_FLAGS_VRAM) |
|---|
| 1336 | + WRITE_ONCE(pdd->vram_usage, pdd->vram_usage + args->size); |
|---|
| 1337 | + |
|---|
| 1280 | 1338 | mutex_unlock(&p->mutex); |
|---|
| 1281 | 1339 | |
|---|
| 1282 | 1340 | args->handle = MAKE_HANDLE(args->gpu_id, idr_handle); |
|---|
| 1283 | 1341 | args->mmap_offset = offset; |
|---|
| 1284 | 1342 | |
|---|
| 1343 | + /* MMIO is mapped through kfd device |
|---|
| 1344 | + * Generate a kfd mmap offset |
|---|
| 1345 | + */ |
|---|
| 1346 | + if (flags & KFD_IOC_ALLOC_MEM_FLAGS_MMIO_REMAP) |
|---|
| 1347 | + args->mmap_offset = KFD_MMAP_TYPE_MMIO |
|---|
| 1348 | + | KFD_MMAP_GPU_ID(args->gpu_id); |
|---|
| 1349 | + |
|---|
| 1285 | 1350 | return 0; |
|---|
| 1286 | 1351 | |
|---|
| 1287 | 1352 | err_free: |
|---|
| 1288 | | - dev->kfd2kgd->free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem); |
|---|
| 1353 | + amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL); |
|---|
| 1289 | 1354 | err_unlock: |
|---|
| 1290 | 1355 | mutex_unlock(&p->mutex); |
|---|
| 1291 | 1356 | return err; |
|---|
| .. | .. |
|---|
| 1299 | 1364 | void *mem; |
|---|
| 1300 | 1365 | struct kfd_dev *dev; |
|---|
| 1301 | 1366 | int ret; |
|---|
| 1367 | + uint64_t size = 0; |
|---|
| 1302 | 1368 | |
|---|
| 1303 | 1369 | dev = kfd_device_by_id(GET_GPU_ID(args->handle)); |
|---|
| 1304 | 1370 | if (!dev) |
|---|
| .. | .. |
|---|
| 1320 | 1386 | goto err_unlock; |
|---|
| 1321 | 1387 | } |
|---|
| 1322 | 1388 | |
|---|
| 1323 | | - ret = dev->kfd2kgd->free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem); |
|---|
| 1389 | + ret = amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, |
|---|
| 1390 | + (struct kgd_mem *)mem, &size); |
|---|
| 1324 | 1391 | |
|---|
| 1325 | 1392 | /* If freeing the buffer failed, leave the handle in place for |
|---|
| 1326 | 1393 | * clean-up during process tear-down. |
|---|
| .. | .. |
|---|
| 1328 | 1395 | if (!ret) |
|---|
| 1329 | 1396 | kfd_process_device_remove_obj_handle( |
|---|
| 1330 | 1397 | pdd, GET_IDR_HANDLE(args->handle)); |
|---|
| 1398 | + |
|---|
| 1399 | + WRITE_ONCE(pdd->vram_usage, pdd->vram_usage - size); |
|---|
| 1331 | 1400 | |
|---|
| 1332 | 1401 | err_unlock: |
|---|
| 1333 | 1402 | mutex_unlock(&p->mutex); |
|---|
| .. | .. |
|---|
| 1400 | 1469 | err = PTR_ERR(peer_pdd); |
|---|
| 1401 | 1470 | goto get_mem_obj_from_handle_failed; |
|---|
| 1402 | 1471 | } |
|---|
| 1403 | | - err = peer->kfd2kgd->map_memory_to_gpu( |
|---|
| 1472 | + err = amdgpu_amdkfd_gpuvm_map_memory_to_gpu( |
|---|
| 1404 | 1473 | peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm); |
|---|
| 1405 | 1474 | if (err) { |
|---|
| 1406 | 1475 | pr_err("Failed to map to gpu %d/%d\n", |
|---|
| .. | .. |
|---|
| 1412 | 1481 | |
|---|
| 1413 | 1482 | mutex_unlock(&p->mutex); |
|---|
| 1414 | 1483 | |
|---|
| 1415 | | - err = dev->kfd2kgd->sync_memory(dev->kgd, (struct kgd_mem *) mem, true); |
|---|
| 1484 | + err = amdgpu_amdkfd_gpuvm_sync_memory(dev->kgd, (struct kgd_mem *) mem, true); |
|---|
| 1416 | 1485 | if (err) { |
|---|
| 1417 | 1486 | pr_debug("Sync memory failed, wait interrupted by user signal\n"); |
|---|
| 1418 | 1487 | goto sync_memory_failed; |
|---|
| .. | .. |
|---|
| 1507 | 1576 | err = -ENODEV; |
|---|
| 1508 | 1577 | goto get_mem_obj_from_handle_failed; |
|---|
| 1509 | 1578 | } |
|---|
| 1510 | | - err = dev->kfd2kgd->unmap_memory_to_gpu( |
|---|
| 1579 | + err = amdgpu_amdkfd_gpuvm_unmap_memory_from_gpu( |
|---|
| 1511 | 1580 | peer->kgd, (struct kgd_mem *)mem, peer_pdd->vm); |
|---|
| 1512 | 1581 | if (err) { |
|---|
| 1513 | 1582 | pr_err("Failed to unmap from gpu %d/%d\n", |
|---|
| .. | .. |
|---|
| 1529 | 1598 | copy_from_user_failed: |
|---|
| 1530 | 1599 | kfree(devices_arr); |
|---|
| 1531 | 1600 | return err; |
|---|
| 1601 | +} |
|---|
| 1602 | + |
|---|
| 1603 | +static int kfd_ioctl_alloc_queue_gws(struct file *filep, |
|---|
| 1604 | + struct kfd_process *p, void *data) |
|---|
| 1605 | +{ |
|---|
| 1606 | + int retval; |
|---|
| 1607 | + struct kfd_ioctl_alloc_queue_gws_args *args = data; |
|---|
| 1608 | + struct queue *q; |
|---|
| 1609 | + struct kfd_dev *dev; |
|---|
| 1610 | + |
|---|
| 1611 | + mutex_lock(&p->mutex); |
|---|
| 1612 | + q = pqm_get_user_queue(&p->pqm, args->queue_id); |
|---|
| 1613 | + |
|---|
| 1614 | + if (q) { |
|---|
| 1615 | + dev = q->device; |
|---|
| 1616 | + } else { |
|---|
| 1617 | + retval = -EINVAL; |
|---|
| 1618 | + goto out_unlock; |
|---|
| 1619 | + } |
|---|
| 1620 | + |
|---|
| 1621 | + if (!dev->gws) { |
|---|
| 1622 | + retval = -ENODEV; |
|---|
| 1623 | + goto out_unlock; |
|---|
| 1624 | + } |
|---|
| 1625 | + |
|---|
| 1626 | + if (dev->dqm->sched_policy == KFD_SCHED_POLICY_NO_HWS) { |
|---|
| 1627 | + retval = -ENODEV; |
|---|
| 1628 | + goto out_unlock; |
|---|
| 1629 | + } |
|---|
| 1630 | + |
|---|
| 1631 | + retval = pqm_set_gws(&p->pqm, args->queue_id, args->num_gws ? dev->gws : NULL); |
|---|
| 1632 | + mutex_unlock(&p->mutex); |
|---|
| 1633 | + |
|---|
| 1634 | + args->first_gws = 0; |
|---|
| 1635 | + return retval; |
|---|
| 1636 | + |
|---|
| 1637 | +out_unlock: |
|---|
| 1638 | + mutex_unlock(&p->mutex); |
|---|
| 1639 | + return retval; |
|---|
| 1640 | +} |
|---|
| 1641 | + |
|---|
| 1642 | +static int kfd_ioctl_get_dmabuf_info(struct file *filep, |
|---|
| 1643 | + struct kfd_process *p, void *data) |
|---|
| 1644 | +{ |
|---|
| 1645 | + struct kfd_ioctl_get_dmabuf_info_args *args = data; |
|---|
| 1646 | + struct kfd_dev *dev = NULL; |
|---|
| 1647 | + struct kgd_dev *dma_buf_kgd; |
|---|
| 1648 | + void *metadata_buffer = NULL; |
|---|
| 1649 | + uint32_t flags; |
|---|
| 1650 | + unsigned int i; |
|---|
| 1651 | + int r; |
|---|
| 1652 | + |
|---|
| 1653 | + /* Find a KFD GPU device that supports the get_dmabuf_info query */ |
|---|
| 1654 | + for (i = 0; kfd_topology_enum_kfd_devices(i, &dev) == 0; i++) |
|---|
| 1655 | + if (dev) |
|---|
| 1656 | + break; |
|---|
| 1657 | + if (!dev) |
|---|
| 1658 | + return -EINVAL; |
|---|
| 1659 | + |
|---|
| 1660 | + if (args->metadata_ptr) { |
|---|
| 1661 | + metadata_buffer = kzalloc(args->metadata_size, GFP_KERNEL); |
|---|
| 1662 | + if (!metadata_buffer) |
|---|
| 1663 | + return -ENOMEM; |
|---|
| 1664 | + } |
|---|
| 1665 | + |
|---|
| 1666 | + /* Get dmabuf info from KGD */ |
|---|
| 1667 | + r = amdgpu_amdkfd_get_dmabuf_info(dev->kgd, args->dmabuf_fd, |
|---|
| 1668 | + &dma_buf_kgd, &args->size, |
|---|
| 1669 | + metadata_buffer, args->metadata_size, |
|---|
| 1670 | + &args->metadata_size, &flags); |
|---|
| 1671 | + if (r) |
|---|
| 1672 | + goto exit; |
|---|
| 1673 | + |
|---|
| 1674 | + /* Reverse-lookup gpu_id from kgd pointer */ |
|---|
| 1675 | + dev = kfd_device_by_kgd(dma_buf_kgd); |
|---|
| 1676 | + if (!dev) { |
|---|
| 1677 | + r = -EINVAL; |
|---|
| 1678 | + goto exit; |
|---|
| 1679 | + } |
|---|
| 1680 | + args->gpu_id = dev->id; |
|---|
| 1681 | + args->flags = flags; |
|---|
| 1682 | + |
|---|
| 1683 | + /* Copy metadata buffer to user mode */ |
|---|
| 1684 | + if (metadata_buffer) { |
|---|
| 1685 | + r = copy_to_user((void __user *)args->metadata_ptr, |
|---|
| 1686 | + metadata_buffer, args->metadata_size); |
|---|
| 1687 | + if (r != 0) |
|---|
| 1688 | + r = -EFAULT; |
|---|
| 1689 | + } |
|---|
| 1690 | + |
|---|
| 1691 | +exit: |
|---|
| 1692 | + kfree(metadata_buffer); |
|---|
| 1693 | + |
|---|
| 1694 | + return r; |
|---|
| 1695 | +} |
|---|
| 1696 | + |
|---|
| 1697 | +static int kfd_ioctl_import_dmabuf(struct file *filep, |
|---|
| 1698 | + struct kfd_process *p, void *data) |
|---|
| 1699 | +{ |
|---|
| 1700 | + struct kfd_ioctl_import_dmabuf_args *args = data; |
|---|
| 1701 | + struct kfd_process_device *pdd; |
|---|
| 1702 | + struct dma_buf *dmabuf; |
|---|
| 1703 | + struct kfd_dev *dev; |
|---|
| 1704 | + int idr_handle; |
|---|
| 1705 | + uint64_t size; |
|---|
| 1706 | + void *mem; |
|---|
| 1707 | + int r; |
|---|
| 1708 | + |
|---|
| 1709 | + dev = kfd_device_by_id(args->gpu_id); |
|---|
| 1710 | + if (!dev) |
|---|
| 1711 | + return -EINVAL; |
|---|
| 1712 | + |
|---|
| 1713 | + dmabuf = dma_buf_get(args->dmabuf_fd); |
|---|
| 1714 | + if (IS_ERR(dmabuf)) |
|---|
| 1715 | + return PTR_ERR(dmabuf); |
|---|
| 1716 | + |
|---|
| 1717 | + mutex_lock(&p->mutex); |
|---|
| 1718 | + |
|---|
| 1719 | + pdd = kfd_bind_process_to_device(dev, p); |
|---|
| 1720 | + if (IS_ERR(pdd)) { |
|---|
| 1721 | + r = PTR_ERR(pdd); |
|---|
| 1722 | + goto err_unlock; |
|---|
| 1723 | + } |
|---|
| 1724 | + |
|---|
| 1725 | + r = amdgpu_amdkfd_gpuvm_import_dmabuf(dev->kgd, dmabuf, |
|---|
| 1726 | + args->va_addr, pdd->vm, |
|---|
| 1727 | + (struct kgd_mem **)&mem, &size, |
|---|
| 1728 | + NULL); |
|---|
| 1729 | + if (r) |
|---|
| 1730 | + goto err_unlock; |
|---|
| 1731 | + |
|---|
| 1732 | + idr_handle = kfd_process_device_create_obj_handle(pdd, mem); |
|---|
| 1733 | + if (idr_handle < 0) { |
|---|
| 1734 | + r = -EFAULT; |
|---|
| 1735 | + goto err_free; |
|---|
| 1736 | + } |
|---|
| 1737 | + |
|---|
| 1738 | + mutex_unlock(&p->mutex); |
|---|
| 1739 | + dma_buf_put(dmabuf); |
|---|
| 1740 | + |
|---|
| 1741 | + args->handle = MAKE_HANDLE(args->gpu_id, idr_handle); |
|---|
| 1742 | + |
|---|
| 1743 | + return 0; |
|---|
| 1744 | + |
|---|
| 1745 | +err_free: |
|---|
| 1746 | + amdgpu_amdkfd_gpuvm_free_memory_of_gpu(dev->kgd, (struct kgd_mem *)mem, NULL); |
|---|
| 1747 | +err_unlock: |
|---|
| 1748 | + mutex_unlock(&p->mutex); |
|---|
| 1749 | + dma_buf_put(dmabuf); |
|---|
| 1750 | + return r; |
|---|
| 1751 | +} |
|---|
| 1752 | + |
|---|
| 1753 | +/* Handle requests for watching SMI events */ |
|---|
| 1754 | +static int kfd_ioctl_smi_events(struct file *filep, |
|---|
| 1755 | + struct kfd_process *p, void *data) |
|---|
| 1756 | +{ |
|---|
| 1757 | + struct kfd_ioctl_smi_events_args *args = data; |
|---|
| 1758 | + struct kfd_dev *dev; |
|---|
| 1759 | + |
|---|
| 1760 | + dev = kfd_device_by_id(args->gpuid); |
|---|
| 1761 | + if (!dev) |
|---|
| 1762 | + return -EINVAL; |
|---|
| 1763 | + |
|---|
| 1764 | + return kfd_smi_event_open(dev, &args->anon_fd); |
|---|
| 1532 | 1765 | } |
|---|
| 1533 | 1766 | |
|---|
| 1534 | 1767 | #define AMDKFD_IOCTL_DEF(ioctl, _func, _flags) \ |
|---|
| .. | .. |
|---|
| 1615 | 1848 | AMDKFD_IOCTL_DEF(AMDKFD_IOC_SET_CU_MASK, |
|---|
| 1616 | 1849 | kfd_ioctl_set_cu_mask, 0), |
|---|
| 1617 | 1850 | |
|---|
| 1851 | + AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_QUEUE_WAVE_STATE, |
|---|
| 1852 | + kfd_ioctl_get_queue_wave_state, 0), |
|---|
| 1853 | + |
|---|
| 1854 | + AMDKFD_IOCTL_DEF(AMDKFD_IOC_GET_DMABUF_INFO, |
|---|
| 1855 | + kfd_ioctl_get_dmabuf_info, 0), |
|---|
| 1856 | + |
|---|
| 1857 | + AMDKFD_IOCTL_DEF(AMDKFD_IOC_IMPORT_DMABUF, |
|---|
| 1858 | + kfd_ioctl_import_dmabuf, 0), |
|---|
| 1859 | + |
|---|
| 1860 | + AMDKFD_IOCTL_DEF(AMDKFD_IOC_ALLOC_QUEUE_GWS, |
|---|
| 1861 | + kfd_ioctl_alloc_queue_gws, 0), |
|---|
| 1862 | + |
|---|
| 1863 | + AMDKFD_IOCTL_DEF(AMDKFD_IOC_SMI_EVENTS, |
|---|
| 1864 | + kfd_ioctl_smi_events, 0), |
|---|
| 1618 | 1865 | }; |
|---|
| 1619 | 1866 | |
|---|
| 1620 | 1867 | #define AMDKFD_CORE_IOCTL_COUNT ARRAY_SIZE(amdkfd_ioctls) |
|---|
| .. | .. |
|---|
| 1647 | 1894 | } else |
|---|
| 1648 | 1895 | goto err_i1; |
|---|
| 1649 | 1896 | |
|---|
| 1650 | | - dev_dbg(kfd_device, "ioctl cmd 0x%x (#%d), arg 0x%lx\n", cmd, nr, arg); |
|---|
| 1897 | + dev_dbg(kfd_device, "ioctl cmd 0x%x (#0x%x), arg 0x%lx\n", cmd, nr, arg); |
|---|
| 1651 | 1898 | |
|---|
| 1652 | | - process = kfd_get_process(current); |
|---|
| 1653 | | - if (IS_ERR(process)) { |
|---|
| 1654 | | - dev_dbg(kfd_device, "no process\n"); |
|---|
| 1899 | + /* Get the process struct from the filep. Only the process |
|---|
| 1900 | + * that opened /dev/kfd can use the file descriptor. Child |
|---|
| 1901 | + * processes need to create their own KFD device context. |
|---|
| 1902 | + */ |
|---|
| 1903 | + process = filep->private_data; |
|---|
| 1904 | + if (process->lead_thread != current->group_leader) { |
|---|
| 1905 | + dev_dbg(kfd_device, "Using KFD FD in wrong process\n"); |
|---|
| 1906 | + retcode = -EBADF; |
|---|
| 1655 | 1907 | goto err_i1; |
|---|
| 1656 | 1908 | } |
|---|
| 1657 | 1909 | |
|---|
| .. | .. |
|---|
| 1702 | 1954 | kfree(kdata); |
|---|
| 1703 | 1955 | |
|---|
| 1704 | 1956 | if (retcode) |
|---|
| 1705 | | - dev_dbg(kfd_device, "ret = %d\n", retcode); |
|---|
| 1957 | + dev_dbg(kfd_device, "ioctl cmd (#0x%x), arg 0x%lx, ret = %d\n", |
|---|
| 1958 | + nr, arg, retcode); |
|---|
| 1706 | 1959 | |
|---|
| 1707 | 1960 | return retcode; |
|---|
| 1708 | 1961 | } |
|---|
| 1962 | + |
|---|
| 1963 | +static int kfd_mmio_mmap(struct kfd_dev *dev, struct kfd_process *process, |
|---|
| 1964 | + struct vm_area_struct *vma) |
|---|
| 1965 | +{ |
|---|
| 1966 | + phys_addr_t address; |
|---|
| 1967 | + int ret; |
|---|
| 1968 | + |
|---|
| 1969 | + if (vma->vm_end - vma->vm_start != PAGE_SIZE) |
|---|
| 1970 | + return -EINVAL; |
|---|
| 1971 | + |
|---|
| 1972 | + address = amdgpu_amdkfd_get_mmio_remap_phys_addr(dev->kgd); |
|---|
| 1973 | + |
|---|
| 1974 | + vma->vm_flags |= VM_IO | VM_DONTCOPY | VM_DONTEXPAND | VM_NORESERVE | |
|---|
| 1975 | + VM_DONTDUMP | VM_PFNMAP; |
|---|
| 1976 | + |
|---|
| 1977 | + vma->vm_page_prot = pgprot_noncached(vma->vm_page_prot); |
|---|
| 1978 | + |
|---|
| 1979 | + pr_debug("pasid 0x%x mapping mmio page\n" |
|---|
| 1980 | + " target user address == 0x%08llX\n" |
|---|
| 1981 | + " physical address == 0x%08llX\n" |
|---|
| 1982 | + " vm_flags == 0x%04lX\n" |
|---|
| 1983 | + " size == 0x%04lX\n", |
|---|
| 1984 | + process->pasid, (unsigned long long) vma->vm_start, |
|---|
| 1985 | + address, vma->vm_flags, PAGE_SIZE); |
|---|
| 1986 | + |
|---|
| 1987 | + ret = io_remap_pfn_range(vma, |
|---|
| 1988 | + vma->vm_start, |
|---|
| 1989 | + address >> PAGE_SHIFT, |
|---|
| 1990 | + PAGE_SIZE, |
|---|
| 1991 | + vma->vm_page_prot); |
|---|
| 1992 | + return ret; |
|---|
| 1993 | +} |
|---|
| 1994 | + |
|---|
| 1709 | 1995 | |
|---|
| 1710 | 1996 | static int kfd_mmap(struct file *filp, struct vm_area_struct *vma) |
|---|
| 1711 | 1997 | { |
|---|
| 1712 | 1998 | struct kfd_process *process; |
|---|
| 1713 | 1999 | struct kfd_dev *dev = NULL; |
|---|
| 1714 | | - unsigned long vm_pgoff; |
|---|
| 2000 | + unsigned long mmap_offset; |
|---|
| 1715 | 2001 | unsigned int gpu_id; |
|---|
| 1716 | 2002 | |
|---|
| 1717 | 2003 | process = kfd_get_process(current); |
|---|
| 1718 | 2004 | if (IS_ERR(process)) |
|---|
| 1719 | 2005 | return PTR_ERR(process); |
|---|
| 1720 | 2006 | |
|---|
| 1721 | | - vm_pgoff = vma->vm_pgoff; |
|---|
| 1722 | | - vma->vm_pgoff = KFD_MMAP_OFFSET_VALUE_GET(vm_pgoff); |
|---|
| 1723 | | - gpu_id = KFD_MMAP_GPU_ID_GET(vm_pgoff); |
|---|
| 2007 | + mmap_offset = vma->vm_pgoff << PAGE_SHIFT; |
|---|
| 2008 | + gpu_id = KFD_MMAP_GET_GPU_ID(mmap_offset); |
|---|
| 1724 | 2009 | if (gpu_id) |
|---|
| 1725 | 2010 | dev = kfd_device_by_id(gpu_id); |
|---|
| 1726 | 2011 | |
|---|
| 1727 | | - switch (vm_pgoff & KFD_MMAP_TYPE_MASK) { |
|---|
| 2012 | + switch (mmap_offset & KFD_MMAP_TYPE_MASK) { |
|---|
| 1728 | 2013 | case KFD_MMAP_TYPE_DOORBELL: |
|---|
| 1729 | 2014 | if (!dev) |
|---|
| 1730 | 2015 | return -ENODEV; |
|---|
| .. | .. |
|---|
| 1737 | 2022 | if (!dev) |
|---|
| 1738 | 2023 | return -ENODEV; |
|---|
| 1739 | 2024 | return kfd_reserved_mem_mmap(dev, process, vma); |
|---|
| 2025 | + case KFD_MMAP_TYPE_MMIO: |
|---|
| 2026 | + if (!dev) |
|---|
| 2027 | + return -ENODEV; |
|---|
| 2028 | + return kfd_mmio_mmap(dev, process, vma); |
|---|
| 1740 | 2029 | } |
|---|
| 1741 | 2030 | |
|---|
| 1742 | 2031 | return -EFAULT; |
|---|