Skip to content

Commit 63cf4ca

Browse files
author
Thomas Hellström
committed
drm/i915: Break out the i915_deps utility
Since it's starting to be used outside the i915 TTM move code, move it to a separate set of files.

v2:
- Update the documentation.
v4:
- Rebase.

Signed-off-by: Thomas Hellström <[email protected]>
Reviewed-by: Matthew Auld <[email protected]>
Link: https://patchwork.freedesktop.org/patch/msgid/[email protected]
1 parent 33654ef commit 63cf4ca

File tree

6 files changed

+285
-188
lines changed

6 files changed

+285
-188
lines changed

drivers/gpu/drm/i915/Makefile

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -163,6 +163,7 @@ i915-y += \
163163
i915_active.o \
164164
i915_buddy.o \
165165
i915_cmd_parser.o \
166+
i915_deps.o \
166167
i915_gem_evict.o \
167168
i915_gem_gtt.o \
168169
i915_gem_ww.o \

drivers/gpu/drm/i915/gem/i915_gem_ttm_move.c

Lines changed: 1 addition & 170 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55

66
#include <drm/ttm/ttm_bo_driver.h>
77

8+
#include "i915_deps.h"
89
#include "i915_drv.h"
910
#include "intel_memory_region.h"
1011
#include "intel_region_ttm.h"
@@ -41,176 +42,6 @@ void i915_ttm_migrate_set_failure_modes(bool gpu_migration,
4142
}
4243
#endif
4344

44-
/**
45-
* DOC: Set of utilities to dynamically collect dependencies into a
46-
* structure which is fed into the GT migration code.
47-
*
48-
* Once we can do async unbinding, this is also needed to coalesce
49-
* the migration fence with the unbind fences if these are coalesced
50-
* post-migration.
51-
*
52-
* While collecting the individual dependencies, we store the refcounted
53-
* struct dma_fence pointers in a realloc-managed pointer array, since
54-
* that can be easily fed into a dma_fence_array. Other options are
55-
* available, like for example an xarray for similarity with drm/sched.
56-
* Can be changed easily if needed.
57-
*
58-
* A struct i915_deps needs to be initialized using i915_deps_init().
59-
* If i915_deps_add_dependency() or i915_deps_add_resv() return an
60-
* error code they will internally call i915_deps_fini(), which frees
61-
* all internal references and allocations.
62-
*
63-
* We might want to break this out into a separate file as a utility.
64-
*/
65-
66-
#define I915_DEPS_MIN_ALLOC_CHUNK 8U
67-
68-
static void i915_deps_reset_fences(struct i915_deps *deps)
69-
{
70-
if (deps->fences != &deps->single)
71-
kfree(deps->fences);
72-
deps->num_deps = 0;
73-
deps->fences_size = 1;
74-
deps->fences = &deps->single;
75-
}
76-
77-
static void i915_deps_init(struct i915_deps *deps, gfp_t gfp)
78-
{
79-
deps->fences = NULL;
80-
deps->gfp = gfp;
81-
i915_deps_reset_fences(deps);
82-
}
83-
84-
static void i915_deps_fini(struct i915_deps *deps)
85-
{
86-
unsigned int i;
87-
88-
for (i = 0; i < deps->num_deps; ++i)
89-
dma_fence_put(deps->fences[i]);
90-
91-
if (deps->fences != &deps->single)
92-
kfree(deps->fences);
93-
}
94-
95-
static int i915_deps_grow(struct i915_deps *deps, struct dma_fence *fence,
96-
const struct ttm_operation_ctx *ctx)
97-
{
98-
int ret;
99-
100-
if (deps->num_deps >= deps->fences_size) {
101-
unsigned int new_size = 2 * deps->fences_size;
102-
struct dma_fence **new_fences;
103-
104-
new_size = max(new_size, I915_DEPS_MIN_ALLOC_CHUNK);
105-
new_fences = kmalloc_array(new_size, sizeof(*new_fences), deps->gfp);
106-
if (!new_fences)
107-
goto sync;
108-
109-
memcpy(new_fences, deps->fences,
110-
deps->fences_size * sizeof(*new_fences));
111-
swap(new_fences, deps->fences);
112-
if (new_fences != &deps->single)
113-
kfree(new_fences);
114-
deps->fences_size = new_size;
115-
}
116-
deps->fences[deps->num_deps++] = dma_fence_get(fence);
117-
return 0;
118-
119-
sync:
120-
if (ctx->no_wait_gpu && !dma_fence_is_signaled(fence)) {
121-
ret = -EBUSY;
122-
goto unref;
123-
}
124-
125-
ret = dma_fence_wait(fence, ctx->interruptible);
126-
if (ret)
127-
goto unref;
128-
129-
ret = fence->error;
130-
if (ret)
131-
goto unref;
132-
133-
return 0;
134-
135-
unref:
136-
i915_deps_fini(deps);
137-
return ret;
138-
}
139-
140-
static int i915_deps_sync(const struct i915_deps *deps,
141-
const struct ttm_operation_ctx *ctx)
142-
{
143-
struct dma_fence **fences = deps->fences;
144-
unsigned int i;
145-
int ret = 0;
146-
147-
for (i = 0; i < deps->num_deps; ++i, ++fences) {
148-
if (ctx->no_wait_gpu && !dma_fence_is_signaled(*fences)) {
149-
ret = -EBUSY;
150-
break;
151-
}
152-
153-
ret = dma_fence_wait(*fences, ctx->interruptible);
154-
if (!ret)
155-
ret = (*fences)->error;
156-
if (ret)
157-
break;
158-
}
159-
160-
return ret;
161-
}
162-
163-
static int i915_deps_add_dependency(struct i915_deps *deps,
164-
struct dma_fence *fence,
165-
const struct ttm_operation_ctx *ctx)
166-
{
167-
unsigned int i;
168-
int ret;
169-
170-
if (!fence)
171-
return 0;
172-
173-
if (dma_fence_is_signaled(fence)) {
174-
ret = fence->error;
175-
if (ret)
176-
i915_deps_fini(deps);
177-
return ret;
178-
}
179-
180-
for (i = 0; i < deps->num_deps; ++i) {
181-
struct dma_fence *entry = deps->fences[i];
182-
183-
if (!entry->context || entry->context != fence->context)
184-
continue;
185-
186-
if (dma_fence_is_later(fence, entry)) {
187-
dma_fence_put(entry);
188-
deps->fences[i] = dma_fence_get(fence);
189-
}
190-
191-
return 0;
192-
}
193-
194-
return i915_deps_grow(deps, fence, ctx);
195-
}
196-
197-
static int i915_deps_add_resv(struct i915_deps *deps, struct dma_resv *resv,
198-
const struct ttm_operation_ctx *ctx)
199-
{
200-
struct dma_resv_iter iter;
201-
struct dma_fence *fence;
202-
int ret;
203-
204-
dma_resv_assert_held(resv);
205-
dma_resv_for_each_fence(&iter, resv, true, fence) {
206-
ret = i915_deps_add_dependency(deps, fence, ctx);
207-
if (ret)
208-
return ret;
209-
}
210-
211-
return 0;
212-
}
213-
21445
static enum i915_cache_level
21546
i915_ttm_cache_level(struct drm_i915_private *i915, struct ttm_resource *res,
21647
struct ttm_tt *ttm)

drivers/gpu/drm/i915/gem/i915_gem_ttm_move.h

Lines changed: 0 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -18,23 +18,6 @@ struct ttm_tt;
1818
struct drm_i915_gem_object;
1919
struct i915_refct_sgt;
2020

21-
/**
22-
* struct i915_deps - Collect dependencies into a single dma-fence
23-
* @single: Storage for pointer if the collection is a single fence.
24-
* @fences: Allocated array of fence pointers if more than a single fence;
25-
* otherwise points to the address of @single.
26-
* @num_deps: Current number of dependency fences.
27-
* @fences_size: Size of the @fences array in number of pointers.
28-
* @gfp: Allocation mode.
29-
*/
30-
struct i915_deps {
31-
struct dma_fence *single;
32-
struct dma_fence **fences;
33-
unsigned int num_deps;
34-
unsigned int fences_size;
35-
gfp_t gfp;
36-
};
37-
3821
int i915_ttm_move_notify(struct ttm_buffer_object *bo);
3922

4023
I915_SELFTEST_DECLARE(void i915_ttm_migrate_set_failure_modes(bool gpu_migration,

0 commit comments

Comments
 (0)