Skip to content

Commit 2459e56

Browse files
committed
drm/i915/uapi: implement object placement extension
Add new extension to support setting an immutable-priority-list of potential placements, at creation time. If we use the normal gem_create or gem_create_ext without the extensions/placements then we still get the old behaviour with only placing the object in system memory. v2(Daniel & Jason): - Add a bunch of kernel-doc - Simplify design for placements extension Testcase: igt/gem_create/create-ext-placement-sanity-check Testcase: igt/gem_create/create-ext-placement-each Testcase: igt/gem_create/create-ext-placement-all Signed-off-by: Matthew Auld <[email protected]> Signed-off-by: CQ Tang <[email protected]> Cc: Joonas Lahtinen <[email protected]> Cc: Daniele Ceraolo Spurio <[email protected]> Cc: Lionel Landwerlin <[email protected]> Cc: Jordan Justen <[email protected]> Cc: Daniel Vetter <[email protected]> Cc: Kenneth Graunke <[email protected]> Cc: Jason Ekstrand <[email protected]> Cc: Dave Airlie <[email protected]> Cc: [email protected] Cc: [email protected] Reviewed-by: Kenneth Graunke <[email protected]> Link: https://patchwork.freedesktop.org/patch/msgid/[email protected]
1 parent ebcb402 commit 2459e56

File tree

7 files changed

+318
-17
lines changed

7 files changed

+318
-17
lines changed

drivers/gpu/drm/i915/gem/i915_gem_create.c

Lines changed: 201 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -4,12 +4,51 @@
44
*/
55

66
#include "gem/i915_gem_ioctls.h"
7+
#include "gem/i915_gem_lmem.h"
78
#include "gem/i915_gem_region.h"
89

910
#include "i915_drv.h"
1011
#include "i915_trace.h"
1112
#include "i915_user_extensions.h"
1213

14+
static u32 object_max_page_size(struct drm_i915_gem_object *obj)
15+
{
16+
u32 max_page_size = 0;
17+
int i;
18+
19+
for (i = 0; i < obj->mm.n_placements; i++) {
20+
struct intel_memory_region *mr = obj->mm.placements[i];
21+
22+
GEM_BUG_ON(!is_power_of_2(mr->min_page_size));
23+
max_page_size = max_t(u32, max_page_size, mr->min_page_size);
24+
}
25+
26+
GEM_BUG_ON(!max_page_size);
27+
return max_page_size;
28+
}
29+
30+
static void object_set_placements(struct drm_i915_gem_object *obj,
31+
struct intel_memory_region **placements,
32+
unsigned int n_placements)
33+
{
34+
GEM_BUG_ON(!n_placements);
35+
36+
/*
37+
* For the common case of one memory region, skip storing an
38+
* allocated array and just point at the region directly.
39+
*/
40+
if (n_placements == 1) {
41+
struct intel_memory_region *mr = placements[0];
42+
struct drm_i915_private *i915 = mr->i915;
43+
44+
obj->mm.placements = &i915->mm.regions[mr->id];
45+
obj->mm.n_placements = 1;
46+
} else {
47+
obj->mm.placements = placements;
48+
obj->mm.n_placements = n_placements;
49+
}
50+
}
51+
1352
static int i915_gem_publish(struct drm_i915_gem_object *obj,
1453
struct drm_file *file,
1554
u64 *size_p,
@@ -29,14 +68,12 @@ static int i915_gem_publish(struct drm_i915_gem_object *obj,
2968
}
3069

3170
static int
32-
i915_gem_setup(struct drm_i915_gem_object *obj,
33-
struct intel_memory_region *mr,
34-
u64 size)
71+
i915_gem_setup(struct drm_i915_gem_object *obj, u64 size)
3572
{
73+
struct intel_memory_region *mr = obj->mm.placements[0];
3674
int ret;
3775

38-
GEM_BUG_ON(!is_power_of_2(mr->min_page_size));
39-
size = round_up(size, mr->min_page_size);
76+
size = round_up(size, object_max_page_size(obj));
4077
if (size == 0)
4178
return -EINVAL;
4279

@@ -62,6 +99,7 @@ i915_gem_dumb_create(struct drm_file *file,
6299
struct drm_mode_create_dumb *args)
63100
{
64101
struct drm_i915_gem_object *obj;
102+
struct intel_memory_region *mr;
65103
enum intel_memory_type mem_type;
66104
int cpp = DIV_ROUND_UP(args->bpp, 8);
67105
u32 format;
@@ -102,10 +140,10 @@ i915_gem_dumb_create(struct drm_file *file,
102140
if (!obj)
103141
return -ENOMEM;
104142

105-
ret = i915_gem_setup(obj,
106-
intel_memory_region_by_type(to_i915(dev),
107-
mem_type),
108-
args->size);
143+
mr = intel_memory_region_by_type(to_i915(dev), mem_type);
144+
object_set_placements(obj, &mr, 1);
145+
146+
ret = i915_gem_setup(obj, args->size);
109147
if (ret)
110148
goto object_free;
111149

@@ -129,6 +167,7 @@ i915_gem_create_ioctl(struct drm_device *dev, void *data,
129167
struct drm_i915_private *i915 = to_i915(dev);
130168
struct drm_i915_gem_create *args = data;
131169
struct drm_i915_gem_object *obj;
170+
struct intel_memory_region *mr;
132171
int ret;
133172

134173
i915_gem_flush_free_objects(i915);
@@ -137,10 +176,10 @@ i915_gem_create_ioctl(struct drm_device *dev, void *data,
137176
if (!obj)
138177
return -ENOMEM;
139178

140-
ret = i915_gem_setup(obj,
141-
intel_memory_region_by_type(i915,
142-
INTEL_MEMORY_SYSTEM),
143-
args->size);
179+
mr = intel_memory_region_by_type(i915, INTEL_MEMORY_SYSTEM);
180+
object_set_placements(obj, &mr, 1);
181+
182+
ret = i915_gem_setup(obj, args->size);
144183
if (ret)
145184
goto object_free;
146185

@@ -156,7 +195,144 @@ struct create_ext {
156195
struct drm_i915_gem_object *vanilla_object;
157196
};
158197

198+
static void repr_placements(char *buf, size_t size,
199+
struct intel_memory_region **placements,
200+
int n_placements)
201+
{
202+
int i;
203+
204+
buf[0] = '\0';
205+
206+
for (i = 0; i < n_placements; i++) {
207+
struct intel_memory_region *mr = placements[i];
208+
int r;
209+
210+
r = snprintf(buf, size, "\n %s -> { class: %d, inst: %d }",
211+
mr->name, mr->type, mr->instance);
212+
if (r >= size)
213+
return;
214+
215+
buf += r;
216+
size -= r;
217+
}
218+
}
219+
220+
static int set_placements(struct drm_i915_gem_create_ext_memory_regions *args,
221+
struct create_ext *ext_data)
222+
{
223+
struct drm_i915_private *i915 = ext_data->i915;
224+
struct drm_i915_gem_memory_class_instance __user *uregions =
225+
u64_to_user_ptr(args->regions);
226+
struct drm_i915_gem_object *obj = ext_data->vanilla_object;
227+
struct intel_memory_region **placements;
228+
u32 mask;
229+
int i, ret = 0;
230+
231+
if (args->pad) {
232+
drm_dbg(&i915->drm, "pad should be zero\n");
233+
ret = -EINVAL;
234+
}
235+
236+
if (!args->num_regions) {
237+
drm_dbg(&i915->drm, "num_regions is zero\n");
238+
ret = -EINVAL;
239+
}
240+
241+
if (args->num_regions > ARRAY_SIZE(i915->mm.regions)) {
242+
drm_dbg(&i915->drm, "num_regions is too large\n");
243+
ret = -EINVAL;
244+
}
245+
246+
if (ret)
247+
return ret;
248+
249+
placements = kmalloc_array(args->num_regions,
250+
sizeof(struct intel_memory_region *),
251+
GFP_KERNEL);
252+
if (!placements)
253+
return -ENOMEM;
254+
255+
mask = 0;
256+
for (i = 0; i < args->num_regions; i++) {
257+
struct drm_i915_gem_memory_class_instance region;
258+
struct intel_memory_region *mr;
259+
260+
if (copy_from_user(&region, uregions, sizeof(region))) {
261+
ret = -EFAULT;
262+
goto out_free;
263+
}
264+
265+
mr = intel_memory_region_lookup(i915,
266+
region.memory_class,
267+
region.memory_instance);
268+
if (!mr || mr->private) {
269+
drm_dbg(&i915->drm, "Device is missing region { class: %d, inst: %d } at index = %d\n",
270+
region.memory_class, region.memory_instance, i);
271+
ret = -EINVAL;
272+
goto out_dump;
273+
}
274+
275+
if (mask & BIT(mr->id)) {
276+
drm_dbg(&i915->drm, "Found duplicate placement %s -> { class: %d, inst: %d } at index = %d\n",
277+
mr->name, region.memory_class,
278+
region.memory_instance, i);
279+
ret = -EINVAL;
280+
goto out_dump;
281+
}
282+
283+
placements[i] = mr;
284+
mask |= BIT(mr->id);
285+
286+
++uregions;
287+
}
288+
289+
if (obj->mm.placements) {
290+
ret = -EINVAL;
291+
goto out_dump;
292+
}
293+
294+
object_set_placements(obj, placements, args->num_regions);
295+
if (args->num_regions == 1)
296+
kfree(placements);
297+
298+
return 0;
299+
300+
out_dump:
301+
if (1) {
302+
char buf[256];
303+
304+
if (obj->mm.placements) {
305+
repr_placements(buf,
306+
sizeof(buf),
307+
obj->mm.placements,
308+
obj->mm.n_placements);
309+
drm_dbg(&i915->drm,
310+
"Placements were already set in previous EXT. Existing placements: %s\n",
311+
buf);
312+
}
313+
314+
repr_placements(buf, sizeof(buf), placements, i);
315+
drm_dbg(&i915->drm, "New placements(so far validated): %s\n", buf);
316+
}
317+
318+
out_free:
319+
kfree(placements);
320+
return ret;
321+
}
322+
323+
static int ext_set_placements(struct i915_user_extension __user *base,
324+
void *data)
325+
{
326+
struct drm_i915_gem_create_ext_memory_regions ext;
327+
328+
if (copy_from_user(&ext, base, sizeof(ext)))
329+
return -EFAULT;
330+
331+
return set_placements(&ext, data);
332+
}
333+
159334
static const i915_user_extension_fn create_extensions[] = {
335+
[I915_GEM_CREATE_EXT_MEMORY_REGIONS] = ext_set_placements,
160336
};
161337

162338
/**
@@ -172,6 +348,7 @@ i915_gem_create_ext_ioctl(struct drm_device *dev, void *data,
172348
struct drm_i915_private *i915 = to_i915(dev);
173349
struct drm_i915_gem_create_ext *args = data;
174350
struct create_ext ext_data = { .i915 = i915 };
351+
struct intel_memory_region **placements_ext;
175352
struct drm_i915_gem_object *obj;
176353
int ret;
177354

@@ -189,19 +366,26 @@ i915_gem_create_ext_ioctl(struct drm_device *dev, void *data,
189366
create_extensions,
190367
ARRAY_SIZE(create_extensions),
191368
&ext_data);
369+
placements_ext = obj->mm.placements;
192370
if (ret)
193371
goto object_free;
194372

195-
ret = i915_gem_setup(obj,
196-
intel_memory_region_by_type(i915,
197-
INTEL_MEMORY_SYSTEM),
198-
args->size);
373+
if (!placements_ext) {
374+
struct intel_memory_region *mr =
375+
intel_memory_region_by_type(i915, INTEL_MEMORY_SYSTEM);
376+
377+
object_set_placements(obj, &mr, 1);
378+
}
379+
380+
ret = i915_gem_setup(obj, args->size);
199381
if (ret)
200382
goto object_free;
201383

202384
return i915_gem_publish(obj, file, &args->size, &args->handle);
203385

204386
object_free:
387+
if (obj->mm.n_placements > 1)
388+
kfree(placements_ext);
205389
i915_gem_object_free(obj);
206390
return ret;
207391
}

drivers/gpu/drm/i915/gem/i915_gem_object.c

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -249,6 +249,9 @@ static void __i915_gem_free_objects(struct drm_i915_private *i915,
249249
if (obj->ops->release)
250250
obj->ops->release(obj);
251251

252+
if (obj->mm.n_placements > 1)
253+
kfree(obj->mm.placements);
254+
252255
/* But keep the pointer alive for RCU-protected lookups */
253256
call_rcu(&obj->rcu, __i915_gem_free_object_rcu);
254257
cond_resched();

drivers/gpu/drm/i915/gem/i915_gem_object_types.h

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -219,6 +219,12 @@ struct drm_i915_gem_object {
219219
atomic_t pages_pin_count;
220220
atomic_t shrink_pin;
221221

222+
/**
223+
* Priority list of potential placements for this object.
224+
*/
225+
struct intel_memory_region **placements;
226+
int n_placements;
227+
222228
/**
223229
* Memory region for this object.
224230
*/

drivers/gpu/drm/i915/gem/selftests/i915_gem_mman.c

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -842,6 +842,24 @@ static bool can_mmap(struct drm_i915_gem_object *obj, enum i915_mmap_type type)
842842
return true;
843843
}
844844

845+
static void object_set_placements(struct drm_i915_gem_object *obj,
846+
struct intel_memory_region **placements,
847+
unsigned int n_placements)
848+
{
849+
GEM_BUG_ON(!n_placements);
850+
851+
if (n_placements == 1) {
852+
struct drm_i915_private *i915 = to_i915(obj->base.dev);
853+
struct intel_memory_region *mr = placements[0];
854+
855+
obj->mm.placements = &i915->mm.regions[mr->id];
856+
obj->mm.n_placements = 1;
857+
} else {
858+
obj->mm.placements = placements;
859+
obj->mm.n_placements = n_placements;
860+
}
861+
}
862+
845863
#define expand32(x) (((x) << 0) | ((x) << 8) | ((x) << 16) | ((x) << 24))
846864
static int __igt_mmap(struct drm_i915_private *i915,
847865
struct drm_i915_gem_object *obj,
@@ -950,6 +968,8 @@ static int igt_mmap(void *arg)
950968
if (IS_ERR(obj))
951969
return PTR_ERR(obj);
952970

971+
object_set_placements(obj, &mr, 1);
972+
953973
err = __igt_mmap(i915, obj, I915_MMAP_TYPE_GTT);
954974
if (err == 0)
955975
err = __igt_mmap(i915, obj, I915_MMAP_TYPE_WC);
@@ -1068,6 +1088,8 @@ static int igt_mmap_access(void *arg)
10681088
if (IS_ERR(obj))
10691089
return PTR_ERR(obj);
10701090

1091+
object_set_placements(obj, &mr, 1);
1092+
10711093
err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_GTT);
10721094
if (err == 0)
10731095
err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_WB);
@@ -1211,6 +1233,8 @@ static int igt_mmap_gpu(void *arg)
12111233
if (IS_ERR(obj))
12121234
return PTR_ERR(obj);
12131235

1236+
object_set_placements(obj, &mr, 1);
1237+
12141238
err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_GTT);
12151239
if (err == 0)
12161240
err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_WC);
@@ -1354,6 +1378,8 @@ static int igt_mmap_revoke(void *arg)
13541378
if (IS_ERR(obj))
13551379
return PTR_ERR(obj);
13561380

1381+
object_set_placements(obj, &mr, 1);
1382+
13571383
err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_GTT);
13581384
if (err == 0)
13591385
err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_WC);

0 commit comments

Comments
 (0)