Diffstat (limited to 'drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c')
 drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c | 230 ++++++++++++++++++++++++++++++++++++++++----------------
 1 file changed, 168 insertions(+), 62 deletions(-)
diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c
index 0ecc88df7208..b7ebae289bea 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c
@@ -317,7 +317,7 @@ static int amdgpu_gem_object_open(struct drm_gem_object *obj,
 	 */
 	if (!vm->is_compute_context || !vm->process_info)
 		return 0;
-	if (!obj->import_attach ||
+	if (!drm_gem_is_imported(obj) ||
 	    !dma_buf_is_dynamic(obj->import_attach->dmabuf))
 		return 0;
 	mutex_lock_nested(&vm->process_info->lock, 1);
@@ -329,7 +329,7 @@ static int amdgpu_gem_object_open(struct drm_gem_object *obj,
 			dev_warn(adev->dev, "validate_and_fence failed: %d\n", r);
 			if (ti) {
-				dev_warn(adev->dev, "pid %d\n", ti->pid);
+				dev_warn(adev->dev, "pid %d\n", ti->task.pid);
 				amdgpu_vm_put_task_info(ti);
 			}
 		}
@@ -443,15 +443,7 @@ int amdgpu_gem_create_ioctl(struct drm_device *dev, void *data,
 	int r;
 
 	/* reject invalid gem flags */
-	if (flags & ~(AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
-		      AMDGPU_GEM_CREATE_NO_CPU_ACCESS |
-		      AMDGPU_GEM_CREATE_CPU_GTT_USWC |
-		      AMDGPU_GEM_CREATE_VRAM_CLEARED |
-		      AMDGPU_GEM_CREATE_VM_ALWAYS_VALID |
-		      AMDGPU_GEM_CREATE_EXPLICIT_SYNC |
-		      AMDGPU_GEM_CREATE_ENCRYPTED |
-		      AMDGPU_GEM_CREATE_GFX12_DCC |
-		      AMDGPU_GEM_CREATE_DISCARDABLE))
+	if (flags & ~AMDGPU_GEM_CREATE_SETTABLE_MASK)
 		return -EINVAL;
 
 	/* reject invalid gem domains */
@@ -466,6 +458,9 @@ int amdgpu_gem_create_ioctl(struct drm_device *dev, void *data,
 	/* always clear VRAM */
 	flags |= AMDGPU_GEM_CREATE_VRAM_CLEARED;
 
+	if (args->in.domains & AMDGPU_GEM_DOMAIN_MMIO_REMAP)
+		return -EINVAL;
+
 	/* create a gem object to contain this object in */
 	if (args->in.domains & (AMDGPU_GEM_DOMAIN_GDS |
 	    AMDGPU_GEM_DOMAIN_GWS | AMDGPU_GEM_DOMAIN_OA)) {
@@ -577,8 +572,7 @@ int amdgpu_gem_userptr_ioctl(struct drm_device *dev, void *data,
 		goto release_object;
 
 	if (args->flags & AMDGPU_GEM_USERPTR_VALIDATE) {
-		r = amdgpu_ttm_tt_get_user_pages(bo, bo->tbo.ttm->pages,
-						 &range);
+		r = amdgpu_ttm_tt_get_user_pages(bo, &range);
 		if (r)
 			goto release_object;
@@ -586,6 +580,8 @@ int amdgpu_gem_userptr_ioctl(struct drm_device *dev, void *data,
 		if (r)
 			goto user_pages_done;
 
+		amdgpu_ttm_tt_set_user_pages(bo->tbo.ttm, range);
+
 		amdgpu_bo_placement_from_domain(bo, AMDGPU_GEM_DOMAIN_GTT);
 		r = ttm_bo_validate(&bo->tbo, &bo->placement, &ctx);
 		amdgpu_bo_unreserve(bo);
@@ -791,36 +787,6 @@ error:
 	return fence;
 }
 
-/**
- * amdgpu_gem_va_map_flags - map GEM UAPI flags into hardware flags
- *
- * @adev: amdgpu_device pointer
- * @flags: GEM UAPI flags
- *
- * Returns the GEM UAPI flags mapped into hardware for the ASIC.
- */
-uint64_t amdgpu_gem_va_map_flags(struct amdgpu_device *adev, uint32_t flags)
-{
-	uint64_t pte_flag = 0;
-
-	if (flags & AMDGPU_VM_PAGE_EXECUTABLE)
-		pte_flag |= AMDGPU_PTE_EXECUTABLE;
-	if (flags & AMDGPU_VM_PAGE_READABLE)
-		pte_flag |= AMDGPU_PTE_READABLE;
-	if (flags & AMDGPU_VM_PAGE_WRITEABLE)
-		pte_flag |= AMDGPU_PTE_WRITEABLE;
-	if (flags & AMDGPU_VM_PAGE_PRT)
-		pte_flag |= AMDGPU_PTE_PRT_FLAG(adev);
-	if (flags & AMDGPU_VM_PAGE_NOALLOC)
-		pte_flag |= AMDGPU_PTE_NOALLOC;
-
-	if (adev->gmc.gmc_funcs->map_mtype)
-		pte_flag |= amdgpu_gmc_map_mtype(adev,
-						 flags & AMDGPU_VM_MTYPE_MASK);
-
-	return pte_flag;
-}
-
 int amdgpu_gem_va_ioctl(struct drm_device *dev, void *data,
 			  struct drm_file *filp)
 {
@@ -841,7 +807,6 @@ int amdgpu_gem_va_ioctl(struct drm_device *dev, void *data,
 	struct dma_fence_chain *timeline_chain = NULL;
 	struct dma_fence *fence;
 	struct drm_exec exec;
-	uint64_t va_flags;
 	uint64_t vm_size;
 	int r = 0;
@@ -945,10 +910,9 @@
 	switch (args->operation) {
 	case AMDGPU_VA_OP_MAP:
-		va_flags = amdgpu_gem_va_map_flags(adev, args->flags);
 		r = amdgpu_vm_bo_map(adev, bo_va, args->va_address,
 				     args->offset_in_bo, args->map_size,
-				     va_flags);
+				     args->flags);
 		break;
 	case AMDGPU_VA_OP_UNMAP:
 		r = amdgpu_vm_bo_unmap(adev, bo_va, args->va_address);
@@ -960,10 +924,9 @@ int amdgpu_gem_va_ioctl(struct drm_device *dev, void *data,
 						args->map_size);
 		break;
 	case AMDGPU_VA_OP_REPLACE:
-		va_flags = amdgpu_gem_va_map_flags(adev, args->flags);
 		r = amdgpu_vm_bo_replace_map(adev, bo_va, args->va_address,
 					     args->offset_in_bo, args->map_size,
-					     va_flags);
+					     args->flags);
 		break;
 	default:
 		break;
@@ -997,17 +960,34 @@ int amdgpu_gem_op_ioctl(struct drm_device *dev, void *data,
 	struct drm_gem_object *gobj;
 	struct amdgpu_vm_bo_base *base;
 	struct amdgpu_bo *robj;
+	struct drm_exec exec;
+	struct amdgpu_fpriv *fpriv = filp->driver_priv;
 	int r;
 
+	if (args->padding)
+		return -EINVAL;
+
 	gobj = drm_gem_object_lookup(filp, args->handle);
 	if (!gobj)
 		return -ENOENT;
 
 	robj = gem_to_amdgpu_bo(gobj);
-	r = amdgpu_bo_reserve(robj, false);
-	if (unlikely(r))
-		goto out;
+	drm_exec_init(&exec, DRM_EXEC_INTERRUPTIBLE_WAIT |
+			  DRM_EXEC_IGNORE_DUPLICATES, 0);
+	drm_exec_until_all_locked(&exec) {
+		r = drm_exec_lock_obj(&exec, gobj);
+		drm_exec_retry_on_contention(&exec);
+		if (r)
+			goto out_exec;
+
+		if (args->op == AMDGPU_GEM_OP_GET_MAPPING_INFO) {
+			r = amdgpu_vm_lock_pd(&fpriv->vm, &exec, 0);
+			drm_exec_retry_on_contention(&exec);
+			if (r)
+				goto out_exec;
+		}
+	}
 
 	switch (args->op) {
 	case AMDGPU_GEM_OP_GET_GEM_CREATE_INFO: {
@@ -1018,29 +998,26 @@ int amdgpu_gem_op_ioctl(struct drm_device *dev, void *data,
 		info.alignment = robj->tbo.page_alignment << PAGE_SHIFT;
 		info.domains = robj->preferred_domains;
 		info.domain_flags = robj->flags;
-		amdgpu_bo_unreserve(robj);
+		drm_exec_fini(&exec);
 		if (copy_to_user(out, &info, sizeof(info)))
 			r = -EFAULT;
 		break;
 	}
 	case AMDGPU_GEM_OP_SET_PLACEMENT:
-		if (robj->tbo.base.import_attach &&
+		if (drm_gem_is_imported(&robj->tbo.base) &&
 		    args->value & AMDGPU_GEM_DOMAIN_VRAM) {
 			r = -EINVAL;
-			amdgpu_bo_unreserve(robj);
-			break;
+			goto out_exec;
 		}
 		if (amdgpu_ttm_tt_get_usermm(robj->tbo.ttm)) {
 			r = -EPERM;
-			amdgpu_bo_unreserve(robj);
-			break;
+			goto out_exec;
 		}
 		for (base = robj->vm_bo; base; base = base->next)
 			if (amdgpu_xgmi_same_hive(amdgpu_ttm_adev(robj->tbo.bdev),
 				amdgpu_ttm_adev(base->vm->root.bo->tbo.bdev))) {
 				r = -EINVAL;
-				amdgpu_bo_unreserve(robj);
-				goto out;
+				goto out_exec;
 			}
@@ -1053,17 +1030,146 @@
 		if (robj->flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID)
 			amdgpu_vm_bo_invalidate(robj, true);
 
+		drm_exec_fini(&exec);
+		break;
+	case AMDGPU_GEM_OP_GET_MAPPING_INFO: {
+		struct amdgpu_bo_va *bo_va = amdgpu_vm_bo_find(&fpriv->vm, robj);
+		struct drm_amdgpu_gem_vm_entry *vm_entries;
+		struct amdgpu_bo_va_mapping *mapping;
+		int num_mappings = 0;
+		/*
+		 * num_entries is set as an input to the size of the user-allocated array of
+		 * drm_amdgpu_gem_vm_entry stored at args->value.
+		 * num_entries is sent back as output as the number of mappings the bo has.
+		 * If that number is larger than the size of the array, the ioctl must
+		 * be retried.
+		 */
+		vm_entries = kvcalloc(args->num_entries, sizeof(*vm_entries), GFP_KERNEL);
+		if (!vm_entries)
+			return -ENOMEM;
+
+		amdgpu_vm_bo_va_for_each_valid_mapping(bo_va, mapping) {
+			if (num_mappings < args->num_entries) {
+				vm_entries[num_mappings].addr = mapping->start * AMDGPU_GPU_PAGE_SIZE;
+				vm_entries[num_mappings].size = (mapping->last - mapping->start + 1) * AMDGPU_GPU_PAGE_SIZE;
+				vm_entries[num_mappings].offset = mapping->offset;
+				vm_entries[num_mappings].flags = mapping->flags;
+			}
+			num_mappings += 1;
+		}
+
+		amdgpu_vm_bo_va_for_each_invalid_mapping(bo_va, mapping) {
+			if (num_mappings < args->num_entries) {
+				vm_entries[num_mappings].addr = mapping->start * AMDGPU_GPU_PAGE_SIZE;
+				vm_entries[num_mappings].size = (mapping->last - mapping->start + 1) * AMDGPU_GPU_PAGE_SIZE;
+				vm_entries[num_mappings].offset = mapping->offset;
+				vm_entries[num_mappings].flags = mapping->flags;
+			}
+			num_mappings += 1;
+		}
+
+		drm_exec_fini(&exec);
+
+		if (num_mappings > 0 && num_mappings <= args->num_entries)
+			if (copy_to_user(u64_to_user_ptr(args->value), vm_entries, num_mappings * sizeof(*vm_entries)))
+				r = -EFAULT;
+
+		args->num_entries = num_mappings;
 
-		amdgpu_bo_unreserve(robj);
+		kvfree(vm_entries);
 		break;
+	}
 	default:
-		amdgpu_bo_unreserve(robj);
+		drm_exec_fini(&exec);
 		r = -EINVAL;
 	}
 
-out:
 	drm_gem_object_put(gobj);
 	return r;
+out_exec:
+	drm_exec_fini(&exec);
+	drm_gem_object_put(gobj);
+	return r;
+}
+
+/**
+ * amdgpu_gem_list_handles_ioctl - get information about a process' buffer objects
+ *
+ * @dev: drm device pointer
+ * @data: drm_amdgpu_gem_list_handles
+ * @filp: drm file pointer
+ *
+ * num_entries is set as an input to the size of the entries array.
+ * num_entries is sent back as output as the number of bos in the process.
+ * If that number is larger than the size of the array, the ioctl must
+ * be retried.
+ *
+ * Returns:
+ * 0 for success, -errno for errors.
+ */
+int amdgpu_gem_list_handles_ioctl(struct drm_device *dev, void *data,
+				  struct drm_file *filp)
+{
+	struct drm_amdgpu_gem_list_handles *args = data;
+	struct drm_amdgpu_gem_list_handles_entry *bo_entries;
+	struct drm_gem_object *gobj;
+	int id, ret = 0;
+	int bo_index = 0;
+	int num_bos = 0;
+
+	spin_lock(&filp->table_lock);
+	idr_for_each_entry(&filp->object_idr, gobj, id)
+		num_bos += 1;
+	spin_unlock(&filp->table_lock);
+
+	if (args->num_entries < num_bos) {
+		args->num_entries = num_bos;
+		return 0;
+	}
+
+	if (num_bos == 0) {
+		args->num_entries = 0;
+		return 0;
+	}
+
+	bo_entries = kvcalloc(num_bos, sizeof(*bo_entries), GFP_KERNEL);
+	if (!bo_entries)
+		return -ENOMEM;
+
+	spin_lock(&filp->table_lock);
+	idr_for_each_entry(&filp->object_idr, gobj, id) {
+		struct amdgpu_bo *bo = gem_to_amdgpu_bo(gobj);
+		struct drm_amdgpu_gem_list_handles_entry *bo_entry;
+
+		if (bo_index >= num_bos) {
+			ret = -EAGAIN;
+			break;
+		}
+
+		bo_entry = &bo_entries[bo_index];
+
+		bo_entry->size = amdgpu_bo_size(bo);
+		bo_entry->alloc_flags = bo->flags & AMDGPU_GEM_CREATE_SETTABLE_MASK;
+		bo_entry->preferred_domains = bo->preferred_domains;
+		bo_entry->gem_handle = id;
+		bo_entry->alignment = bo->tbo.page_alignment;
+
+		if (bo->tbo.base.import_attach)
+			bo_entry->flags |= AMDGPU_GEM_LIST_HANDLES_FLAG_IS_IMPORT;
+
+		bo_index += 1;
+	}
+	spin_unlock(&filp->table_lock);
+
+	args->num_entries = bo_index;
+
+	if (!ret)
+		if (copy_to_user(u64_to_user_ptr(args->entries), bo_entries, num_bos * sizeof(*bo_entries)))
+			ret = -EFAULT;
+
+	kvfree(bo_entries);
+
+	return ret;
 }
 
 static int amdgpu_gem_align_pitch(struct amdgpu_device *adev,
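
Note on AMDGPU_GEM_CREATE_SETTABLE_MASK: the open-coded flag list removed from amdgpu_gem_create_ioctl() above is folded into a single mask, which amdgpu_gem_list_handles_ioctl() also reuses when reporting alloc_flags. A minimal sketch of the consolidated definition, reconstructed from the removed list; the authoritative definition lives in the amdgpu driver/UAPI headers and may carry additional flags:

/* Sketch reconstructed from the flag list removed above; the authoritative
 * definition may differ or grow over time. */
#define AMDGPU_GEM_CREATE_SETTABLE_MASK (AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED | \
					 AMDGPU_GEM_CREATE_NO_CPU_ACCESS |	 \
					 AMDGPU_GEM_CREATE_CPU_GTT_USWC |	 \
					 AMDGPU_GEM_CREATE_VRAM_CLEARED |	 \
					 AMDGPU_GEM_CREATE_VM_ALWAYS_VALID |	 \
					 AMDGPU_GEM_CREATE_EXPLICIT_SYNC |	 \
					 AMDGPU_GEM_CREATE_ENCRYPTED |		 \
					 AMDGPU_GEM_CREATE_GFX12_DCC |		 \
					 AMDGPU_GEM_CREATE_DISCARDABLE)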
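The reworked amdgpu_gem_op_ioctl() drops amdgpu_bo_reserve() in favour of the drm_exec transaction idiom, which can lock the GEM object and, for AMDGPU_GEM_OP_GET_MAPPING_INFO, the VM page directory together, and transparently restarts on ww-mutex contention. A minimal kernel-side sketch of the idiom, assuming only the drm_exec API from <drm/drm_exec.h>:

#include <drm/drm_exec.h>
#include <drm/drm_gem.h>

/* Sketch of a drm_exec locking transaction; the actual payload is elided. */
static int lock_obj_and_work(struct drm_gem_object *obj)
{
	struct drm_exec exec;
	int r;

	drm_exec_init(&exec, DRM_EXEC_INTERRUPTIBLE_WAIT, 0);
	drm_exec_until_all_locked(&exec) {
		/* Each lock attempt is followed by drm_exec_retry_on_contention():
		 * on -EDEADLK it unwinds all held locks and reruns the loop body. */
		r = drm_exec_lock_obj(&exec, obj);
		drm_exec_retry_on_contention(&exec);
		if (r)
			goto out;
	}

	/* all requested objects are locked here; do the real work */

out:
	drm_exec_fini(&exec);	/* drops every lock taken in the transaction */
	return r;
}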
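The comment in the AMDGPU_GEM_OP_GET_MAPPING_INFO case defines a size-negotiation protocol: userspace passes the capacity of its array in num_entries, and the kernel writes back the real mapping count, which may be larger. A hedged userspace sketch of the resulting retry loop, assuming libdrm's drmIoctl() and the extended struct drm_amdgpu_gem_op layout implied by this diff (the num_entries and padding fields are new and not in released headers):

#include <stdint.h>
#include <stdlib.h>
#include <xf86drm.h>
#include <amdgpu_drm.h>

/* Userspace sketch of the AMDGPU_GEM_OP_GET_MAPPING_INFO retry protocol. */
static int query_mappings(int fd, uint32_t handle,
			  struct drm_amdgpu_gem_vm_entry **out,
			  uint32_t *count)
{
	struct drm_amdgpu_gem_op op = {
		.handle = handle,
		.op = AMDGPU_GEM_OP_GET_MAPPING_INFO,	/* new op from this series */
	};
	struct drm_amdgpu_gem_vm_entry *entries = NULL, *tmp;
	uint32_t n = 4;	/* initial capacity guess */

	for (;;) {
		tmp = realloc(entries, n * sizeof(*entries));
		if (!tmp) {
			free(entries);
			return -1;
		}
		entries = tmp;

		op.num_entries = n;
		op.value = (uintptr_t)entries;
		if (drmIoctl(fd, DRM_IOCTL_AMDGPU_GEM_OP, &op)) {
			free(entries);
			return -1;
		}
		if (op.num_entries <= n)
			break;		/* array was big enough; entries are valid */
		n = op.num_entries;	/* kernel reported the real count: retry */
	}

	*out = entries;
	*count = op.num_entries;
	return 0;
}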
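amdgpu_gem_list_handles_ioctl() speaks the same protocol for enumerating a process' buffer objects. A sketch under the assumption that the series exposes it as DRM_IOCTL_AMDGPU_GEM_LIST_HANDLES with the struct names used above (all new UAPI, so treat every name here as provisional); same headers as the previous sketch:

/* Userspace sketch of the list-handles size negotiation. */
static int list_handles(int fd,
			struct drm_amdgpu_gem_list_handles_entry **out,
			uint32_t *count)
{
	struct drm_amdgpu_gem_list_handles args = {0};
	struct drm_amdgpu_gem_list_handles_entry *entries = NULL;
	uint32_t n = 0;

	for (;;) {
		args.entries = (uintptr_t)entries;
		args.num_entries = n;
		if (drmIoctl(fd, DRM_IOCTL_AMDGPU_GEM_LIST_HANDLES, &args)) {
			free(entries);
			return -1;
		}
		if (args.num_entries <= n)
			break;	/* the array held every BO; entries are valid */
		/* More BOs exist than we allocated for (first pass, or a BO
		 * was created in between): size up and retry. */
		n = args.num_entries;
		free(entries);
		entries = malloc(n * sizeof(*entries));
		if (!entries)
			return -1;
	}

	*out = entries;
	*count = args.num_entries;
	return 0;
}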
