mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	drm/i915: Use a radixtree for random access to the object's backing storage
A while ago we switched from a contiguous array of pages into an sglist, for that was both more convenient for mapping to hardware and avoided the requirement for a vmalloc array of pages on every object. However, certain GEM API calls (like pwrite, pread as well as performing relocations) do desire access to individual struct pages. A quick hack was to introduce a cache of the last access such that finding the following page was quick - this works so long as the caller desired sequential access. Walking backwards, or multiple callers, still hits a slow linear search for each page. One solution is to store each successful lookup in a radix tree. v2: Rewrite building the radixtree for clarity, hopefully. v3: Rearrange execbuf to avoid calling i915_gem_object_get_sg() from within an atomic section and so relax the allocation context to a simple GFP_KERNEL and mutex. Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk> Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin@intel.com> Link: http://patchwork.freedesktop.org/patch/msgid/20161028125858.23563-10-chris@chris-wilson.co.uk
This commit is contained in:
		
							parent
							
								
									4c7d62c6b8
								
							
						
					
					
						commit
						96d7763452
					
				| @ -2286,9 +2286,12 @@ struct drm_i915_gem_object { | |||||||
| 
 | 
 | ||||||
| 	struct sg_table *pages; | 	struct sg_table *pages; | ||||||
| 	int pages_pin_count; | 	int pages_pin_count; | ||||||
| 	struct get_page { | 	struct i915_gem_object_page_iter { | ||||||
| 		struct scatterlist *sg; | 		struct scatterlist *sg_pos; | ||||||
| 		int last; | 		unsigned int sg_idx; /* in pages, but 32bit eek! */ | ||||||
|  | 
 | ||||||
|  | 		struct radix_tree_root radix; | ||||||
|  | 		struct mutex lock; /* protects this cache */ | ||||||
| 	} get_page; | 	} get_page; | ||||||
| 	void *mapping; | 	void *mapping; | ||||||
| 
 | 
 | ||||||
| @ -2491,6 +2494,14 @@ static __always_inline struct sgt_iter { | |||||||
| 	return s; | 	return s; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | static inline struct scatterlist *____sg_next(struct scatterlist *sg) | ||||||
|  | { | ||||||
|  | 	++sg; | ||||||
|  | 	if (unlikely(sg_is_chain(sg))) | ||||||
|  | 		sg = sg_chain_ptr(sg); | ||||||
|  | 	return sg; | ||||||
|  | } | ||||||
|  | 
 | ||||||
| /**
 | /**
 | ||||||
|  * __sg_next - return the next scatterlist entry in a list |  * __sg_next - return the next scatterlist entry in a list | ||||||
|  * @sg:		The current sg entry |  * @sg:		The current sg entry | ||||||
| @ -2505,9 +2516,7 @@ static inline struct scatterlist *__sg_next(struct scatterlist *sg) | |||||||
| #ifdef CONFIG_DEBUG_SG | #ifdef CONFIG_DEBUG_SG | ||||||
| 	BUG_ON(sg->sg_magic != SG_MAGIC); | 	BUG_ON(sg->sg_magic != SG_MAGIC); | ||||||
| #endif | #endif | ||||||
| 	return sg_is_last(sg) ? NULL : | 	return sg_is_last(sg) ? NULL : ____sg_next(sg); | ||||||
| 		likely(!sg_is_chain(++sg)) ? sg : |  | ||||||
| 		sg_chain_ptr(sg); |  | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| /**
 | /**
 | ||||||
| @ -3185,45 +3194,21 @@ static inline int __sg_page_count(struct scatterlist *sg) | |||||||
| 	return sg->length >> PAGE_SHIFT; | 	return sg->length >> PAGE_SHIFT; | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | struct scatterlist * | ||||||
|  | i915_gem_object_get_sg(struct drm_i915_gem_object *obj, | ||||||
|  | 		       unsigned int n, unsigned int *offset); | ||||||
|  | 
 | ||||||
| struct page * | struct page * | ||||||
| i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj, int n); | i915_gem_object_get_page(struct drm_i915_gem_object *obj, | ||||||
|  | 			 unsigned int n); | ||||||
| 
 | 
 | ||||||
| static inline dma_addr_t | struct page * | ||||||
| i915_gem_object_get_dma_address(struct drm_i915_gem_object *obj, int n) | i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj, | ||||||
| { | 			       unsigned int n); | ||||||
| 	if (n < obj->get_page.last) { |  | ||||||
| 		obj->get_page.sg = obj->pages->sgl; |  | ||||||
| 		obj->get_page.last = 0; |  | ||||||
| 	} |  | ||||||
| 
 | 
 | ||||||
| 	while (obj->get_page.last + __sg_page_count(obj->get_page.sg) <= n) { | dma_addr_t | ||||||
| 		obj->get_page.last += __sg_page_count(obj->get_page.sg++); | i915_gem_object_get_dma_address(struct drm_i915_gem_object *obj, | ||||||
| 		if (unlikely(sg_is_chain(obj->get_page.sg))) | 				unsigned long n); | ||||||
| 			obj->get_page.sg = sg_chain_ptr(obj->get_page.sg); |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	return sg_dma_address(obj->get_page.sg) + ((n - obj->get_page.last) << PAGE_SHIFT); |  | ||||||
| } |  | ||||||
| 
 |  | ||||||
| static inline struct page * |  | ||||||
| i915_gem_object_get_page(struct drm_i915_gem_object *obj, int n) |  | ||||||
| { |  | ||||||
| 	if (WARN_ON(n >= obj->base.size >> PAGE_SHIFT)) |  | ||||||
| 		return NULL; |  | ||||||
| 
 |  | ||||||
| 	if (n < obj->get_page.last) { |  | ||||||
| 		obj->get_page.sg = obj->pages->sgl; |  | ||||||
| 		obj->get_page.last = 0; |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	while (obj->get_page.last + __sg_page_count(obj->get_page.sg) <= n) { |  | ||||||
| 		obj->get_page.last += __sg_page_count(obj->get_page.sg++); |  | ||||||
| 		if (unlikely(sg_is_chain(obj->get_page.sg))) |  | ||||||
| 			obj->get_page.sg = sg_chain_ptr(obj->get_page.sg); |  | ||||||
| 	} |  | ||||||
| 
 |  | ||||||
| 	return nth_page(sg_page(obj->get_page.sg), n - obj->get_page.last); |  | ||||||
| } |  | ||||||
| 
 | 
 | ||||||
| static inline void i915_gem_object_pin_pages(struct drm_i915_gem_object *obj) | static inline void i915_gem_object_pin_pages(struct drm_i915_gem_object *obj) | ||||||
| { | { | ||||||
|  | |||||||
| @ -2330,6 +2330,15 @@ i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj) | |||||||
| 	kfree(obj->pages); | 	kfree(obj->pages); | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
|  | static void __i915_gem_object_reset_page_iter(struct drm_i915_gem_object *obj) | ||||||
|  | { | ||||||
|  | 	struct radix_tree_iter iter; | ||||||
|  | 	void **slot; | ||||||
|  | 
 | ||||||
|  | 	radix_tree_for_each_slot(slot, &obj->get_page.radix, &iter, 0) | ||||||
|  | 		radix_tree_delete(&obj->get_page.radix, iter.index); | ||||||
|  | } | ||||||
|  | 
 | ||||||
| int | int | ||||||
| i915_gem_object_put_pages(struct drm_i915_gem_object *obj) | i915_gem_object_put_pages(struct drm_i915_gem_object *obj) | ||||||
| { | { | ||||||
| @ -2362,6 +2371,8 @@ i915_gem_object_put_pages(struct drm_i915_gem_object *obj) | |||||||
| 		obj->mapping = NULL; | 		obj->mapping = NULL; | ||||||
| 	} | 	} | ||||||
| 
 | 
 | ||||||
|  | 	__i915_gem_object_reset_page_iter(obj); | ||||||
|  | 
 | ||||||
| 	ops->put_pages(obj); | 	ops->put_pages(obj); | ||||||
| 	obj->pages = NULL; | 	obj->pages = NULL; | ||||||
| 
 | 
 | ||||||
| @ -2531,8 +2542,8 @@ i915_gem_object_get_pages(struct drm_i915_gem_object *obj) | |||||||
| 
 | 
 | ||||||
| 	list_add_tail(&obj->global_list, &dev_priv->mm.unbound_list); | 	list_add_tail(&obj->global_list, &dev_priv->mm.unbound_list); | ||||||
| 
 | 
 | ||||||
| 	obj->get_page.sg = obj->pages->sgl; | 	obj->get_page.sg_pos = obj->pages->sgl; | ||||||
| 	obj->get_page.last = 0; | 	obj->get_page.sg_idx = 0; | ||||||
| 
 | 
 | ||||||
| 	return 0; | 	return 0; | ||||||
| } | } | ||||||
| @ -4337,6 +4348,8 @@ void i915_gem_object_init(struct drm_i915_gem_object *obj, | |||||||
| 
 | 
 | ||||||
| 	obj->frontbuffer_ggtt_origin = ORIGIN_GTT; | 	obj->frontbuffer_ggtt_origin = ORIGIN_GTT; | ||||||
| 	obj->madv = I915_MADV_WILLNEED; | 	obj->madv = I915_MADV_WILLNEED; | ||||||
|  | 	INIT_RADIX_TREE(&obj->get_page.radix, GFP_KERNEL | __GFP_NOWARN); | ||||||
|  | 	mutex_init(&obj->get_page.lock); | ||||||
| 
 | 
 | ||||||
| 	i915_gem_info_add_obj(to_i915(obj->base.dev), obj->base.size); | 	i915_gem_info_add_obj(to_i915(obj->base.dev), obj->base.size); | ||||||
| } | } | ||||||
| @ -5032,21 +5045,6 @@ void i915_gem_track_fb(struct drm_i915_gem_object *old, | |||||||
| 	} | 	} | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| /* Like i915_gem_object_get_page(), but mark the returned page dirty */ |  | ||||||
| struct page * |  | ||||||
| i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj, int n) |  | ||||||
| { |  | ||||||
| 	struct page *page; |  | ||||||
| 
 |  | ||||||
| 	/* Only default objects have per-page dirty tracking */ |  | ||||||
| 	if (WARN_ON(!i915_gem_object_has_struct_page(obj))) |  | ||||||
| 		return NULL; |  | ||||||
| 
 |  | ||||||
| 	page = i915_gem_object_get_page(obj, n); |  | ||||||
| 	set_page_dirty(page); |  | ||||||
| 	return page; |  | ||||||
| } |  | ||||||
| 
 |  | ||||||
| /* Allocate a new GEM object and fill it with the supplied data */ | /* Allocate a new GEM object and fill it with the supplied data */ | ||||||
| struct drm_i915_gem_object * | struct drm_i915_gem_object * | ||||||
| i915_gem_object_create_from_data(struct drm_device *dev, | i915_gem_object_create_from_data(struct drm_device *dev, | ||||||
| @ -5087,3 +5085,156 @@ fail: | |||||||
| 	i915_gem_object_put(obj); | 	i915_gem_object_put(obj); | ||||||
| 	return ERR_PTR(ret); | 	return ERR_PTR(ret); | ||||||
| } | } | ||||||
|  | 
 | ||||||
|  | struct scatterlist * | ||||||
|  | i915_gem_object_get_sg(struct drm_i915_gem_object *obj, | ||||||
|  | 		       unsigned int n, | ||||||
|  | 		       unsigned int *offset) | ||||||
|  | { | ||||||
|  | 	struct i915_gem_object_page_iter *iter = &obj->get_page; | ||||||
|  | 	struct scatterlist *sg; | ||||||
|  | 	unsigned int idx, count; | ||||||
|  | 
 | ||||||
|  | 	might_sleep(); | ||||||
|  | 	GEM_BUG_ON(n >= obj->base.size >> PAGE_SHIFT); | ||||||
|  | 	GEM_BUG_ON(obj->pages_pin_count == 0); | ||||||
|  | 
 | ||||||
|  | 	/* As we iterate forward through the sg, we record each entry in a
 | ||||||
|  | 	 * radixtree for quick repeated (backwards) lookups. If we have seen | ||||||
|  | 	 * this index previously, we will have an entry for it. | ||||||
|  | 	 * | ||||||
|  | 	 * Initial lookup is O(N), but this is amortized to O(1) for | ||||||
|  | 	 * sequential page access (where each new request is consecutive | ||||||
|  | 	 * to the previous one). Repeated lookups are O(lg(obj->base.size)), | ||||||
|  | 	 * i.e. O(1) with a large constant! | ||||||
|  | 	 */ | ||||||
|  | 	if (n < READ_ONCE(iter->sg_idx)) | ||||||
|  | 		goto lookup; | ||||||
|  | 
 | ||||||
|  | 	mutex_lock(&iter->lock); | ||||||
|  | 
 | ||||||
|  | 	/* We prefer to reuse the last sg so that repeated lookup of this
 | ||||||
|  | 	 * (or the subsequent) sg are fast - comparing against the last | ||||||
|  | 	 * sg is faster than going through the radixtree. | ||||||
|  | 	 */ | ||||||
|  | 
 | ||||||
|  | 	sg = iter->sg_pos; | ||||||
|  | 	idx = iter->sg_idx; | ||||||
|  | 	count = __sg_page_count(sg); | ||||||
|  | 
 | ||||||
|  | 	while (idx + count <= n) { | ||||||
|  | 		unsigned long exception, i; | ||||||
|  | 		int ret; | ||||||
|  | 
 | ||||||
|  | 		/* If we cannot allocate and insert this entry, or the
 | ||||||
|  | 		 * individual pages from this range, cancel updating the | ||||||
|  | 		 * sg_idx so that on this lookup we are forced to linearly | ||||||
|  | 		 * scan onwards, but on future lookups we will try the | ||||||
|  | 		 * insertion again (in which case we need to be careful of | ||||||
|  | 		 * the error return reporting that we have already inserted | ||||||
|  | 		 * this index). | ||||||
|  | 		 */ | ||||||
|  | 		ret = radix_tree_insert(&iter->radix, idx, sg); | ||||||
|  | 		if (ret && ret != -EEXIST) | ||||||
|  | 			goto scan; | ||||||
|  | 
 | ||||||
|  | 		exception = | ||||||
|  | 			RADIX_TREE_EXCEPTIONAL_ENTRY | | ||||||
|  | 			idx << RADIX_TREE_EXCEPTIONAL_SHIFT; | ||||||
|  | 		for (i = 1; i < count; i++) { | ||||||
|  | 			ret = radix_tree_insert(&iter->radix, idx + i, | ||||||
|  | 						(void *)exception); | ||||||
|  | 			if (ret && ret != -EEXIST) | ||||||
|  | 				goto scan; | ||||||
|  | 		} | ||||||
|  | 
 | ||||||
|  | 		idx += count; | ||||||
|  | 		sg = ____sg_next(sg); | ||||||
|  | 		count = __sg_page_count(sg); | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | scan: | ||||||
|  | 	iter->sg_pos = sg; | ||||||
|  | 	iter->sg_idx = idx; | ||||||
|  | 
 | ||||||
|  | 	mutex_unlock(&iter->lock); | ||||||
|  | 
 | ||||||
|  | 	if (unlikely(n < idx)) /* insertion completed by another thread */ | ||||||
|  | 		goto lookup; | ||||||
|  | 
 | ||||||
|  | 	/* In case we failed to insert the entry into the radixtree, we need
 | ||||||
|  | 	 * to look beyond the current sg. | ||||||
|  | 	 */ | ||||||
|  | 	while (idx + count <= n) { | ||||||
|  | 		idx += count; | ||||||
|  | 		sg = ____sg_next(sg); | ||||||
|  | 		count = __sg_page_count(sg); | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	*offset = n - idx; | ||||||
|  | 	return sg; | ||||||
|  | 
 | ||||||
|  | lookup: | ||||||
|  | 	rcu_read_lock(); | ||||||
|  | 
 | ||||||
|  | 	sg = radix_tree_lookup(&iter->radix, n); | ||||||
|  | 	GEM_BUG_ON(!sg); | ||||||
|  | 
 | ||||||
|  | 	/* If this index is in the middle of multi-page sg entry,
 | ||||||
|  | 	 * the radixtree will contain an exceptional entry that points | ||||||
|  | 	 * to the start of that range. We will return the pointer to | ||||||
|  | 	 * the base page and the offset of this page within the | ||||||
|  | 	 * sg entry's range. | ||||||
|  | 	 */ | ||||||
|  | 	*offset = 0; | ||||||
|  | 	if (unlikely(radix_tree_exception(sg))) { | ||||||
|  | 		unsigned long base = | ||||||
|  | 			(unsigned long)sg >> RADIX_TREE_EXCEPTIONAL_SHIFT; | ||||||
|  | 
 | ||||||
|  | 		sg = radix_tree_lookup(&iter->radix, base); | ||||||
|  | 		GEM_BUG_ON(!sg); | ||||||
|  | 
 | ||||||
|  | 		*offset = n - base; | ||||||
|  | 	} | ||||||
|  | 
 | ||||||
|  | 	rcu_read_unlock(); | ||||||
|  | 
 | ||||||
|  | 	return sg; | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | struct page * | ||||||
|  | i915_gem_object_get_page(struct drm_i915_gem_object *obj, unsigned int n) | ||||||
|  | { | ||||||
|  | 	struct scatterlist *sg; | ||||||
|  | 	unsigned int offset; | ||||||
|  | 
 | ||||||
|  | 	GEM_BUG_ON(!i915_gem_object_has_struct_page(obj)); | ||||||
|  | 
 | ||||||
|  | 	sg = i915_gem_object_get_sg(obj, n, &offset); | ||||||
|  | 	return nth_page(sg_page(sg), offset); | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | /* Like i915_gem_object_get_page(), but mark the returned page dirty */ | ||||||
|  | struct page * | ||||||
|  | i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj, | ||||||
|  | 			       unsigned int n) | ||||||
|  | { | ||||||
|  | 	struct page *page; | ||||||
|  | 
 | ||||||
|  | 	page = i915_gem_object_get_page(obj, n); | ||||||
|  | 	if (!obj->dirty) | ||||||
|  | 		set_page_dirty(page); | ||||||
|  | 
 | ||||||
|  | 	return page; | ||||||
|  | } | ||||||
|  | 
 | ||||||
|  | dma_addr_t | ||||||
|  | i915_gem_object_get_dma_address(struct drm_i915_gem_object *obj, | ||||||
|  | 				unsigned long n) | ||||||
|  | { | ||||||
|  | 	struct scatterlist *sg; | ||||||
|  | 	unsigned int offset; | ||||||
|  | 
 | ||||||
|  | 	sg = i915_gem_object_get_sg(obj, n, &offset); | ||||||
|  | 	return sg_dma_address(sg) + (offset << PAGE_SHIFT); | ||||||
|  | } | ||||||
|  | |||||||
| @ -595,8 +595,8 @@ _i915_gem_object_create_stolen(struct drm_device *dev, | |||||||
| 	if (obj->pages == NULL) | 	if (obj->pages == NULL) | ||||||
| 		goto cleanup; | 		goto cleanup; | ||||||
| 
 | 
 | ||||||
| 	obj->get_page.sg = obj->pages->sgl; | 	obj->get_page.sg_pos = obj->pages->sgl; | ||||||
| 	obj->get_page.last = 0; | 	obj->get_page.sg_idx = 0; | ||||||
| 
 | 
 | ||||||
| 	i915_gem_object_pin_pages(obj); | 	i915_gem_object_pin_pages(obj); | ||||||
| 	obj->stolen = stolen; | 	obj->stolen = stolen; | ||||||
|  | |||||||
| @ -530,8 +530,8 @@ __i915_gem_userptr_get_pages_worker(struct work_struct *_work) | |||||||
| 			if (ret == 0) { | 			if (ret == 0) { | ||||||
| 				list_add_tail(&obj->global_list, | 				list_add_tail(&obj->global_list, | ||||||
| 					      &to_i915(dev)->mm.unbound_list); | 					      &to_i915(dev)->mm.unbound_list); | ||||||
| 				obj->get_page.sg = obj->pages->sgl; | 				obj->get_page.sg_pos = obj->pages->sgl; | ||||||
| 				obj->get_page.last = 0; | 				obj->get_page.sg_idx = 0; | ||||||
| 				pinned = 0; | 				pinned = 0; | ||||||
| 			} | 			} | ||||||
| 		} | 		} | ||||||
|  | |||||||
		Loading…
	
		Reference in New Issue
	
	Block a user
	 Chris Wilson
						Chris Wilson