diff options
| author | Daniel Vetter <daniel.vetter@ffwll.ch> | 2017-11-21 11:33:10 +0100 | 
|---|---|---|
| committer | Daniel Vetter <daniel.vetter@ffwll.ch> | 2017-11-21 14:17:56 +0100 | 
| commit | 70c5f93669249886b151812076509f30569aff80 (patch) | |
| tree | 05dce785f3a70e022b91016c87e4092f143a2fef /drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c | |
| parent | c83ecfa5851f4d35be88f32dabb3a53f51cf5c32 (diff) | |
| parent | f150891fd9878ef0d9197c4e8451ce67c3bdd014 (diff) | |
Merge airlied/drm-next into drm-misc-next
Bake in the conflict between the drm_print.h extraction and the
addition of DRM_DEBUG_LEASES since we lost it a few too many times.
Also fix a new use of drm_plane_helper_check_state in msm to follow
Ville's conversion in
commit a01cb8ba3f6282934cff65e89ab36b18b14cbe27
Author: Ville Syrjälä <ville.syrjala@linux.intel.com>
Date:   Wed Nov 1 22:16:19 2017 +0200
    drm: Move drm_plane_helper_check_state() into drm_atomic_helper.c
Acked-by: Ville Syrjälä <ville.syrjala@linux.intel.com>
Signed-off-by: Daniel Vetter <daniel.vetter@ffwll.ch>
Diffstat (limited to 'drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c')
| -rw-r--r-- | drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c | 225 | 
1 files changed, 148 insertions, 77 deletions
| diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c index c6a214f1e991..f7fceb63413c 100644 --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c @@ -25,6 +25,7 @@   *    Jerome Glisse <glisse@freedesktop.org>   */  #include <linux/pagemap.h> +#include <linux/sync_file.h>  #include <drm/drmP.h>  #include <drm/amdgpu_drm.h>  #include <drm/drm_syncobj.h> @@ -89,12 +90,14 @@ static int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)  		goto free_chunk;  	} +	mutex_lock(&p->ctx->lock); +  	/* get chunks */  	chunk_array_user = u64_to_user_ptr(cs->in.chunks);  	if (copy_from_user(chunk_array, chunk_array_user,  			   sizeof(uint64_t)*cs->in.num_chunks)) {  		ret = -EFAULT; -		goto put_ctx; +		goto free_chunk;  	}  	p->nchunks = cs->in.num_chunks; @@ -102,7 +105,7 @@ static int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)  			    GFP_KERNEL);  	if (!p->chunks) {  		ret = -ENOMEM; -		goto put_ctx; +		goto free_chunk;  	}  	for (i = 0; i < p->nchunks; i++) { @@ -169,6 +172,11 @@ static int amdgpu_cs_parser_init(struct amdgpu_cs_parser *p, void *data)  	if (ret)  		goto free_all_kdata; +	if (p->ctx->vram_lost_counter != p->job->vram_lost_counter) { +		ret = -ECANCELED; +		goto free_all_kdata; +	} +  	if (p->uf_entry.robj)  		p->job->uf_addr = uf_offset;  	kfree(chunk_array); @@ -182,8 +190,6 @@ free_partial_kdata:  	kfree(p->chunks);  	p->chunks = NULL;  	p->nchunks = 0; -put_ctx: -	amdgpu_ctx_put(p->ctx);  free_chunk:  	kfree(chunk_array); @@ -704,7 +710,8 @@ static int amdgpu_cs_sync_rings(struct amdgpu_cs_parser *p)  	list_for_each_entry(e, &p->validated, tv.head) {  		struct reservation_object *resv = e->robj->tbo.resv; -		r = amdgpu_sync_resv(p->adev, &p->job->sync, resv, p->filp); +		r = amdgpu_sync_resv(p->adev, &p->job->sync, resv, p->filp, +				     amdgpu_bo_explicit_sync(e->robj));  		if (r)  			return r; @@ -735,8 +742,10 @@ static void amdgpu_cs_parser_fini(struct amdgpu_cs_parser *parser, int error,  	dma_fence_put(parser->fence); -	if (parser->ctx) +	if (parser->ctx) { +		mutex_unlock(&parser->ctx->lock);  		amdgpu_ctx_put(parser->ctx); +	}  	if (parser->bo_list)  		amdgpu_bo_list_put(parser->bo_list); @@ -843,14 +852,58 @@ static int amdgpu_cs_ib_vm_chunk(struct amdgpu_device *adev,  	struct amdgpu_fpriv *fpriv = p->filp->driver_priv;  	struct amdgpu_vm *vm = &fpriv->vm;  	struct amdgpu_ring *ring = p->job->ring; -	int i, r; +	int r;  	/* Only for UVD/VCE VM emulation */ -	if (ring->funcs->parse_cs) { -		for (i = 0; i < p->job->num_ibs; i++) { -			r = amdgpu_ring_parse_cs(ring, p, i); +	if (p->job->ring->funcs->parse_cs) { +		unsigned i, j; + +		for (i = 0, j = 0; i < p->nchunks && j < p->job->num_ibs; i++) { +			struct drm_amdgpu_cs_chunk_ib *chunk_ib; +			struct amdgpu_bo_va_mapping *m; +			struct amdgpu_bo *aobj = NULL; +			struct amdgpu_cs_chunk *chunk; +			struct amdgpu_ib *ib; +			uint64_t offset; +			uint8_t *kptr; + +			chunk = &p->chunks[i]; +			ib = &p->job->ibs[j]; +			chunk_ib = chunk->kdata; + +			if (chunk->chunk_id != AMDGPU_CHUNK_ID_IB) +				continue; + +			r = amdgpu_cs_find_mapping(p, chunk_ib->va_start, +						   &aobj, &m); +			if (r) { +				DRM_ERROR("IB va_start is invalid\n"); +				return r; +			} + +			if ((chunk_ib->va_start + chunk_ib->ib_bytes) > +			    (m->last + 1) * AMDGPU_GPU_PAGE_SIZE) { +				DRM_ERROR("IB va_start+ib_bytes is invalid\n"); +				return -EINVAL; +			} + +			/* the IB should be reserved at this point */ +			r = amdgpu_bo_kmap(aobj, (void **)&kptr); +			if (r) { +				return r; +			} + +			offset = m->start * AMDGPU_GPU_PAGE_SIZE; +			kptr += chunk_ib->va_start - offset; + +			memcpy(ib->ptr, kptr, chunk_ib->ib_bytes); +			amdgpu_bo_kunmap(aobj); + +			r = amdgpu_ring_parse_cs(ring, p, j);  			if (r)  				return r; + +			j++;  		}  	} @@ -917,54 +970,18 @@ static int amdgpu_cs_ib_fill(struct amdgpu_device *adev,  		parser->job->ring = ring; -		if (ring->funcs->parse_cs) { -			struct amdgpu_bo_va_mapping *m; -			struct amdgpu_bo *aobj = NULL; -			uint64_t offset; -			uint8_t *kptr; - -			r = amdgpu_cs_find_mapping(parser, chunk_ib->va_start, -						   &aobj, &m); -			if (r) { -				DRM_ERROR("IB va_start is invalid\n"); -				return r; -			} - -			if ((chunk_ib->va_start + chunk_ib->ib_bytes) > -			    (m->last + 1) * AMDGPU_GPU_PAGE_SIZE) { -				DRM_ERROR("IB va_start+ib_bytes is invalid\n"); -				return -EINVAL; -			} - -			/* the IB should be reserved at this point */ -			r = amdgpu_bo_kmap(aobj, (void **)&kptr); -			if (r) { -				return r; -			} - -			offset = m->start * AMDGPU_GPU_PAGE_SIZE; -			kptr += chunk_ib->va_start - offset; - -			r =  amdgpu_ib_get(adev, vm, chunk_ib->ib_bytes, ib); -			if (r) { -				DRM_ERROR("Failed to get ib !\n"); -				return r; -			} - -			memcpy(ib->ptr, kptr, chunk_ib->ib_bytes); -			amdgpu_bo_kunmap(aobj); -		} else { -			r =  amdgpu_ib_get(adev, vm, 0, ib); -			if (r) { -				DRM_ERROR("Failed to get ib !\n"); -				return r; -			} - +		r =  amdgpu_ib_get(adev, vm, +					ring->funcs->parse_cs ? chunk_ib->ib_bytes : 0, +					ib); +		if (r) { +			DRM_ERROR("Failed to get ib !\n"); +			return r;  		}  		ib->gpu_addr = chunk_ib->va_start;  		ib->length_dw = chunk_ib->ib_bytes / 4;  		ib->flags = chunk_ib->flags; +  		j++;  	} @@ -974,7 +991,7 @@ static int amdgpu_cs_ib_fill(struct amdgpu_device *adev,  	    parser->job->ring->funcs->type == AMDGPU_RING_TYPE_VCE))  		return -EINVAL; -	return 0; +	return amdgpu_ctx_wait_prev_fence(parser->ctx, parser->job->ring->idx);  }  static int amdgpu_cs_process_fence_dep(struct amdgpu_cs_parser *p, @@ -1175,6 +1192,8 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,  	job->uf_sequence = seq;  	amdgpu_job_free_resources(job); +	amdgpu_ring_priority_get(job->ring, +				 amd_sched_get_job_priority(&job->base));  	trace_amdgpu_cs_ioctl(job);  	amd_sched_entity_push_job(&job->base); @@ -1188,7 +1207,6 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,  int amdgpu_cs_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)  {  	struct amdgpu_device *adev = dev->dev_private; -	struct amdgpu_fpriv *fpriv = filp->driver_priv;  	union drm_amdgpu_cs *cs = data;  	struct amdgpu_cs_parser parser = {};  	bool reserved_buffers = false; @@ -1196,8 +1214,6 @@ int amdgpu_cs_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)  	if (!adev->accel_working)  		return -EBUSY; -	if (amdgpu_kms_vram_lost(adev, fpriv)) -		return -ENODEV;  	parser.adev = adev;  	parser.filp = filp; @@ -1208,6 +1224,10 @@ int amdgpu_cs_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)  		goto out;  	} +	r = amdgpu_cs_ib_fill(adev, &parser); +	if (r) +		goto out; +  	r = amdgpu_cs_parser_bos(&parser, data);  	if (r) {  		if (r == -ENOMEM) @@ -1218,9 +1238,6 @@ int amdgpu_cs_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)  	}  	reserved_buffers = true; -	r = amdgpu_cs_ib_fill(adev, &parser); -	if (r) -		goto out;  	r = amdgpu_cs_dependencies(adev, &parser);  	if (r) { @@ -1256,16 +1273,12 @@ int amdgpu_cs_wait_ioctl(struct drm_device *dev, void *data,  {  	union drm_amdgpu_wait_cs *wait = data;  	struct amdgpu_device *adev = dev->dev_private; -	struct amdgpu_fpriv *fpriv = filp->driver_priv;  	unsigned long timeout = amdgpu_gem_timeout(wait->in.timeout);  	struct amdgpu_ring *ring = NULL;  	struct amdgpu_ctx *ctx;  	struct dma_fence *fence;  	long r; -	if (amdgpu_kms_vram_lost(adev, fpriv)) -		return -ENODEV; -  	ctx = amdgpu_ctx_get(filp->driver_priv, wait->in.ctx_id);  	if (ctx == NULL)  		return -EINVAL; @@ -1283,6 +1296,8 @@ int amdgpu_cs_wait_ioctl(struct drm_device *dev, void *data,  		r = PTR_ERR(fence);  	else if (fence) {  		r = dma_fence_wait_timeout(fence, true, timeout); +		if (r > 0 && fence->error) +			r = fence->error;  		dma_fence_put(fence);  	} else  		r = 1; @@ -1330,6 +1345,62 @@ static struct dma_fence *amdgpu_cs_get_fence(struct amdgpu_device *adev,  	return fence;  } +int amdgpu_cs_fence_to_handle_ioctl(struct drm_device *dev, void *data, +				    struct drm_file *filp) +{ +	struct amdgpu_device *adev = dev->dev_private; +	union drm_amdgpu_fence_to_handle *info = data; +	struct dma_fence *fence; +	struct drm_syncobj *syncobj; +	struct sync_file *sync_file; +	int fd, r; + +	fence = amdgpu_cs_get_fence(adev, filp, &info->in.fence); +	if (IS_ERR(fence)) +		return PTR_ERR(fence); + +	switch (info->in.what) { +	case AMDGPU_FENCE_TO_HANDLE_GET_SYNCOBJ: +		r = drm_syncobj_create(&syncobj, 0, fence); +		dma_fence_put(fence); +		if (r) +			return r; +		r = drm_syncobj_get_handle(filp, syncobj, &info->out.handle); +		drm_syncobj_put(syncobj); +		return r; + +	case AMDGPU_FENCE_TO_HANDLE_GET_SYNCOBJ_FD: +		r = drm_syncobj_create(&syncobj, 0, fence); +		dma_fence_put(fence); +		if (r) +			return r; +		r = drm_syncobj_get_fd(syncobj, (int*)&info->out.handle); +		drm_syncobj_put(syncobj); +		return r; + +	case AMDGPU_FENCE_TO_HANDLE_GET_SYNC_FILE_FD: +		fd = get_unused_fd_flags(O_CLOEXEC); +		if (fd < 0) { +			dma_fence_put(fence); +			return fd; +		} + +		sync_file = sync_file_create(fence); +		dma_fence_put(fence); +		if (!sync_file) { +			put_unused_fd(fd); +			return -ENOMEM; +		} + +		fd_install(fd, sync_file->file); +		info->out.handle = fd; +		return 0; + +	default: +		return -EINVAL; +	} +} +  /**   * amdgpu_cs_wait_all_fence - wait on all fences to signal   * @@ -1364,6 +1435,9 @@ static int amdgpu_cs_wait_all_fences(struct amdgpu_device *adev,  		if (r == 0)  			break; + +		if (fence->error) +			return fence->error;  	}  	memset(wait, 0, sizeof(*wait)); @@ -1424,7 +1498,7 @@ out:  	wait->out.status = (r > 0);  	wait->out.first_signaled = first;  	/* set return value 0 to indicate success */ -	r = 0; +	r = array[first]->error;  err_free_fence_array:  	for (i = 0; i < fence_count; i++) @@ -1445,15 +1519,12 @@ int amdgpu_cs_wait_fences_ioctl(struct drm_device *dev, void *data,  				struct drm_file *filp)  {  	struct amdgpu_device *adev = dev->dev_private; -	struct amdgpu_fpriv *fpriv = filp->driver_priv;  	union drm_amdgpu_wait_fences *wait = data;  	uint32_t fence_count = wait->in.fence_count;  	struct drm_amdgpu_fence *fences_user;  	struct drm_amdgpu_fence *fences;  	int r; -	if (amdgpu_kms_vram_lost(adev, fpriv)) -		return -ENODEV;  	/* Get the fences from userspace */  	fences = kmalloc_array(fence_count, sizeof(struct drm_amdgpu_fence),  			GFP_KERNEL); @@ -1511,14 +1582,14 @@ int amdgpu_cs_find_mapping(struct amdgpu_cs_parser *parser,  	if (READ_ONCE((*bo)->tbo.resv->lock.ctx) != &parser->ticket)  		return -EINVAL; -	r = amdgpu_ttm_bind(&(*bo)->tbo, &(*bo)->tbo.mem); -	if (unlikely(r)) -		return r; - -	if ((*bo)->flags & AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS) -		return 0; +	if (!((*bo)->flags & AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS)) { +		(*bo)->flags |= AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS; +		amdgpu_ttm_placement_from_domain(*bo, (*bo)->allowed_domains); +		r = ttm_bo_validate(&(*bo)->tbo, &(*bo)->placement, false, +				    false); +		if (r) +			return r; +	} -	(*bo)->flags |= AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS; -	amdgpu_ttm_placement_from_domain(*bo, (*bo)->allowed_domains); -	return ttm_bo_validate(&(*bo)->tbo, &(*bo)->placement, false, false); +	return amdgpu_ttm_bind(&(*bo)->tbo, &(*bo)->tbo.mem);  } | 
