diff options
Diffstat (limited to 'linux-core')
| -rw-r--r-- | linux-core/i915_gem.c | 178 | 
1 files changed, 133 insertions, 45 deletions
| diff --git a/linux-core/i915_gem.c b/linux-core/i915_gem.c index e795ee77..d630b0b2 100644 --- a/linux-core/i915_gem.c +++ b/linux-core/i915_gem.c @@ -74,6 +74,31 @@ i915_gem_object_free_page_list(struct drm_gem_object *obj)  }  /** + * Ensures that all rendering to the object has completed and the object is + * safe to unbind from the GTT. + */ +static int +i915_gem_object_wait_rendering(struct drm_gem_object *obj) +{ +	struct drm_device *dev = obj->dev; +	struct drm_i915_gem_object *obj_priv = obj->driver_private; +	int ret; + +	/* If there is rendering queued on the buffer being evicted, wait for +	 * it. +	 */ +	if (obj_priv->last_rendering_cookie != 0) { +		ret = i915_wait_irq(dev, obj_priv->last_rendering_cookie); +		if (ret != 0) +			return ret; +		/* Clear it now that we know it's passed. */ +		obj_priv->last_rendering_cookie = 0; +	} + +	return 0; +} + +/**   * Unbinds an object from the GTT aperture.   */  static void @@ -88,6 +113,8 @@ i915_gem_object_unbind(struct drm_gem_object *obj)  	if (obj_priv->gtt_space == NULL)  		return; +	i915_gem_object_wait_rendering(obj); +  	if (obj_priv->agp_mem != NULL) {  		drm_unbind_agp(obj_priv->agp_mem);  		drm_free_agp(obj_priv->agp_mem, obj->size / PAGE_SIZE); @@ -97,8 +124,10 @@ i915_gem_object_unbind(struct drm_gem_object *obj)  	drm_memrange_put_block(obj_priv->gtt_space);  	obj_priv->gtt_space = NULL; +	list_del_init(&obj_priv->gtt_lru_entry);  } +#if 0  static void  i915_gem_dump_page (struct page *page, uint32_t start, uint32_t end, uint32_t bias, uint32_t mark)  { @@ -139,6 +168,39 @@ i915_gem_dump_object (struct drm_gem_object *obj, int len, const char *where, ui  		}  	}  } +#endif + +static int +i915_gem_evict_something(struct drm_device *dev) +{ +	drm_i915_private_t *dev_priv = dev->dev_private; +	struct drm_gem_object *obj; +	struct drm_i915_gem_object *obj_priv; +	int ret; + +	/* Find the LRU buffer. */ +	BUG_ON(!list_empty(&dev_priv->mm.gtt_lru)); +	obj_priv = list_entry(dev_priv->mm.gtt_lru.prev, +			      struct drm_i915_gem_object, +			      gtt_lru_entry); +	obj = obj_priv->obj; + +	/* Only unpinned buffers should be on this list. */ +	BUG_ON(obj_priv->pin_count != 0); + +	/* Do this separately from the wait_rendering in +	 * i915_gem_object_unbind() because we want to catch interrupts and +	 * return. +	 */ +	ret = i915_gem_object_wait_rendering(obj); +	if (ret != 0) +		return ret; + +	/* Wait on the rendering and unbind the buffer. */ +	i915_gem_object_unbind(obj); + +	return 0; +}  /**   * Finds free space in the GTT aperture and binds the object there. @@ -150,7 +212,7 @@ i915_gem_object_bind_to_gtt(struct drm_gem_object *obj, unsigned alignment)  	drm_i915_private_t *dev_priv = dev->dev_private;  	struct drm_i915_gem_object *obj_priv = obj->driver_private;  	struct drm_memrange_node *free_space; -	int page_count, i; +	int page_count, i, ret;  	if (alignment == 0)  		alignment = PAGE_SIZE; @@ -159,18 +221,31 @@ i915_gem_object_bind_to_gtt(struct drm_gem_object *obj, unsigned alignment)  		return -EINVAL;  	} + search_free:  	free_space = drm_memrange_search_free(&dev_priv->mm.gtt_space,  					      obj->size,  					      alignment, 0); -	if (free_space == NULL) -		return -ENOMEM; -	obj_priv->gtt_space = drm_memrange_get_block(free_space, -						     obj->size, -						     alignment); -	if (obj_priv->gtt_space == NULL) -		return -ENOMEM; -	obj_priv->gtt_space->private = obj; -	obj_priv->gtt_offset = obj_priv->gtt_space->start; +	if (free_space != NULL) { +		obj_priv->gtt_space = +			drm_memrange_get_block(free_space, obj->size, +					       alignment); +		if (obj_priv->gtt_space != NULL) { +			obj_priv->gtt_space->private = obj; +			obj_priv->gtt_offset = obj_priv->gtt_space->start; +		} +	} +	if (obj_priv->gtt_space == NULL) { +		/* If the gtt is empty and we're still having trouble +		 * fitting our object in, we're out of memory. +		 */ +		if (list_empty(&dev_priv->mm.gtt_lru)) +			return -ENOMEM; + +		ret = i915_gem_evict_something(dev); +		if (ret != 0) +			return ret; +		goto search_free; +	}  #if WATCH_BUF  	DRM_INFO ("Binding object of size %d at 0x%08x\n", obj->size, obj_priv->gtt_offset); @@ -229,6 +304,7 @@ i915_gem_reloc_and_validate_object(struct drm_gem_object *obj,  				   struct drm_i915_gem_validate_entry *entry)  {  	struct drm_device *dev = obj->dev; +	drm_i915_private_t *dev_priv = dev->dev_private;  	struct drm_i915_gem_relocation_entry reloc;  	struct drm_i915_gem_relocation_entry __user *relocs;  	struct drm_i915_gem_object *obj_priv = obj->driver_private; @@ -244,6 +320,12 @@ i915_gem_reloc_and_validate_object(struct drm_gem_object *obj,  	}  	entry->buffer_offset = obj_priv->gtt_offset; +	if (obj_priv->pin_count == 0) { +		/* Move our buffer to the head of the LRU. */ +		list_del_init(&obj_priv->gtt_lru_entry); +		list_add(&obj_priv->gtt_lru_entry, &dev_priv->mm.gtt_lru); +	} +  	relocs = (struct drm_i915_gem_relocation_entry __user *) (uintptr_t) entry->relocs_ptr;  	/* Apply the relocations, using the GTT aperture to avoid cache  	 * flushing requirements. @@ -285,6 +367,9 @@ i915_gem_reloc_and_validate_object(struct drm_gem_object *obj,  			return -EINVAL;  		} +		if (target_obj_priv->gtt_offset == reloc.presumed_offset) +			continue; +  		/* Map the page containing the relocation we're going to  		 * perform.  		 */ @@ -328,8 +413,8 @@ i915_gem_reloc_and_validate_object(struct drm_gem_object *obj,  	return 0;  } -static int -i915_gem_sync(struct drm_device *dev) +static void +i915_gem_flush(struct drm_device *dev)  {  	drm_i915_private_t *dev_priv = dev->dev_private;  	RING_LOCALS; @@ -338,8 +423,6 @@ i915_gem_sync(struct drm_device *dev)  	OUT_RING(CMD_MI_FLUSH | MI_READ_FLUSH | MI_EXE_FLUSH);  	OUT_RING(0); /* noop */  	ADVANCE_LP_RING(); - -	return i915_quiescent(dev);  }  static int @@ -409,6 +492,7 @@ i915_gem_execbuffer(struct drm_device *dev, void *data,  	struct drm_gem_object **object_list;  	int ret, i;  	uint64_t exec_offset; +	uint32_t cookie;  	LOCK_TEST_WITH_RETURN(dev, file_priv); @@ -418,14 +502,6 @@ i915_gem_execbuffer(struct drm_device *dev, void *data,  #endif  	i915_kernel_lost_context(dev); -	/* Big hammer: flush and idle the hardware so we can map things in/out. -	 */ -	ret = i915_gem_sync(dev); -	if (ret != 0) { -		DRM_ERROR ("i915_gem_sync failed %d\n", ret); -		return ret; -	} -  	/* Copy in the validate list from userland */  	validate_list = drm_calloc(sizeof(*validate_list), args->buffer_count,  				   DRM_MEM_DRIVER); @@ -465,6 +541,21 @@ i915_gem_execbuffer(struct drm_device *dev, void *data,  		}  	} +	for (i = 0; i < args->buffer_count; i++) { +		struct drm_gem_object *obj = object_list[i]; +		struct drm_i915_gem_object *obj_priv = obj->driver_private; + +		if (obj_priv->gtt_space == NULL) { +			/* We evicted the buffer in the process of validating +			 * our set of buffers in.  We could try to recover by +			 * kicking them everything out and trying again from +			 * the start. +			 */ +			ret = -ENOMEM; +			goto err; +		} +	} +  	exec_offset = validate_list[args->buffer_count - 1].buffer_offset;  	/* make sure all previous memory operations have passed */ @@ -484,6 +575,25 @@ i915_gem_execbuffer(struct drm_device *dev, void *data,  		goto err;  	} +	/* Flush the rendering.  We want this flush to go away, which will +	 * require intelligent cache management. +	 */ +	i915_gem_flush(dev); + +	/* Get a cookie representing the flush of the current buffer, which we +	 * can wait on.  We would like to mitigate these interrupts, likely by +	 * only flushing occasionally (so that we have *some* interrupts +	 * representing completion of buffers that we can wait on when trying +	 * to clear up gtt space). +	 */ +	cookie = i915_emit_irq(dev); +	for (i = 0; i < args->buffer_count; i++) { +		struct drm_gem_object *obj = object_list[i]; +		struct drm_i915_gem_object *obj_priv = obj->driver_private; + +		obj_priv->last_rendering_cookie = cookie; +	} +  	/* Copy the new buffer offsets back to the user's validate list. */  	ret = copy_to_user((struct drm_i915_relocation_entry __user*)(uintptr_t)  			   args->buffers_ptr, @@ -492,28 +602,6 @@ i915_gem_execbuffer(struct drm_device *dev, void *data,  	if (ret)  		DRM_ERROR ("failed to copy %d validate entries back to user (%d)\n",  			   args->buffer_count, ret); - -	/* Clean up and return */ -	ret = i915_gem_sync(dev); -	if (ret) -	{ -		drm_i915_private_t *dev_priv = dev->dev_private; -		uint32_t acthd = I915_READ(IS_I965G(dev) ? I965REG_ACTHD : I915REG_ACTHD); -		DRM_ERROR ("failed to sync %d acthd %08x\n", ret, acthd); -		i915_gem_dump_object (object_list[args->buffer_count - 1], -				      args->batch_len, -				      __FUNCTION__, -				      acthd); -	} - -	/* Evict all the buffers we moved in, leaving room for the next guy. */ -	for (i = 0; i < args->buffer_count; i++) { -		struct drm_gem_object *obj = object_list[i]; -		struct drm_i915_gem_object *obj_priv = obj->driver_private; - -		if (obj_priv->pin_count == 0) -			i915_gem_object_unbind(obj); -	}  err:  	if (object_list != NULL) {  		for (i = 0; i < args->buffer_count; i++) @@ -592,7 +680,7 @@ int i915_gem_init_object(struct drm_gem_object *obj)  		return -ENOMEM;  	obj->driver_private = obj_priv; - +	INIT_LIST_HEAD(&obj_priv->gtt_lru_entry);  	return 0;  } | 
