Skip to content

Commit a9ac0fa

Browse files
committed
drm/xe: Strict migration policy for atomic SVM faults
Mixing GPU and CPU atomics does not work unless a strict migration policy of GPU atomics must be device memory. Enforce a policy of must be in VRAM with a retry loop of 3 attempts, if retry loop fails abort fault. Removing always_migrate_to_vram modparam as we now have real migration policy. v2: - Only retry migration on atomics - Drop alway migrate modparam v3: - Only set vram_only on DGFX (Himal) - Bail on get_pages failure if vram_only and retry count exceeded (Himal) - s/vram_only/devmem_only - Update xe_svm_range_is_valid to accept devmem_only argument v4: - Fix logic bug get_pages failure v5: - Fix commit message (Himal) - Mention removing always_migrate_to_vram in commit message (Lucas) - Fix xe_svm_range_is_valid to check for devmem pages - Bail on devmem_only && !migrate_devmem (Thomas) v6: - Add READ_ONCE barriers for opportunistic checks (Thomas) - Pair READ_ONCE with WRITE_ONCE (Thomas) v7: - Adjust comments (Thomas) Fixes: 2f118c9 ("drm/xe: Add SVM VRAM migration") Cc: stable@vger.kernel.org Signed-off-by: Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com> Signed-off-by: Matthew Brost <matthew.brost@intel.com> Acked-by: Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com> Reviewed-by: Thomas Hellström <thomas.hellstrom@linux.intel.com> Link: https://lore.kernel.org/r/20250512135500.1405019-3-matthew.brost@intel.com
1 parent 8a9b978 commit a9ac0fa

File tree

7 files changed

+140
-57
lines changed

7 files changed

+140
-57
lines changed

drivers/gpu/drm/drm_gpusvm.c

Lines changed: 18 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1118,6 +1118,10 @@ static void __drm_gpusvm_range_unmap_pages(struct drm_gpusvm *gpusvm,
11181118
lockdep_assert_held(&gpusvm->notifier_lock);
11191119

11201120
if (range->flags.has_dma_mapping) {
1121+
struct drm_gpusvm_range_flags flags = {
1122+
.__flags = range->flags.__flags,
1123+
};
1124+
11211125
for (i = 0, j = 0; i < npages; j++) {
11221126
struct drm_pagemap_device_addr *addr = &range->dma_addr[j];
11231127

@@ -1131,8 +1135,12 @@ static void __drm_gpusvm_range_unmap_pages(struct drm_gpusvm *gpusvm,
11311135
dev, *addr);
11321136
i += 1 << addr->order;
11331137
}
1134-
range->flags.has_devmem_pages = false;
1135-
range->flags.has_dma_mapping = false;
1138+
1139+
/* WRITE_ONCE pairs with READ_ONCE for opportunistic checks */
1140+
flags.has_devmem_pages = false;
1141+
flags.has_dma_mapping = false;
1142+
WRITE_ONCE(range->flags.__flags, flags.__flags);
1143+
11361144
range->dpagemap = NULL;
11371145
}
11381146
}
@@ -1334,6 +1342,7 @@ int drm_gpusvm_range_get_pages(struct drm_gpusvm *gpusvm,
13341342
int err = 0;
13351343
struct dev_pagemap *pagemap;
13361344
struct drm_pagemap *dpagemap;
1345+
struct drm_gpusvm_range_flags flags;
13371346

13381347
retry:
13391348
hmm_range.notifier_seq = mmu_interval_read_begin(notifier);
@@ -1378,7 +1387,8 @@ int drm_gpusvm_range_get_pages(struct drm_gpusvm *gpusvm,
13781387
*/
13791388
drm_gpusvm_notifier_lock(gpusvm);
13801389

1381-
if (range->flags.unmapped) {
1390+
flags.__flags = range->flags.__flags;
1391+
if (flags.unmapped) {
13821392
drm_gpusvm_notifier_unlock(gpusvm);
13831393
err = -EFAULT;
13841394
goto err_free;
@@ -1474,14 +1484,17 @@ int drm_gpusvm_range_get_pages(struct drm_gpusvm *gpusvm,
14741484
}
14751485
i += 1 << order;
14761486
num_dma_mapped = i;
1477-
range->flags.has_dma_mapping = true;
1487+
flags.has_dma_mapping = true;
14781488
}
14791489

14801490
if (zdd) {
1481-
range->flags.has_devmem_pages = true;
1491+
flags.has_devmem_pages = true;
14821492
range->dpagemap = dpagemap;
14831493
}
14841494

1495+
/* WRITE_ONCE pairs with READ_ONCE for opportunistic checks */
1496+
WRITE_ONCE(range->flags.__flags, flags.__flags);
1497+
14851498
drm_gpusvm_notifier_unlock(gpusvm);
14861499
kvfree(pfns);
14871500
set_seqno:

drivers/gpu/drm/xe/xe_module.c

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -30,9 +30,6 @@ struct xe_modparam xe_modparam = {
3030
module_param_named(svm_notifier_size, xe_modparam.svm_notifier_size, uint, 0600);
3131
MODULE_PARM_DESC(svm_notifier_size, "Set the svm notifier size(in MiB), must be power of 2");
3232

33-
module_param_named(always_migrate_to_vram, xe_modparam.always_migrate_to_vram, bool, 0444);
34-
MODULE_PARM_DESC(always_migrate_to_vram, "Always migrate to VRAM on GPU fault");
35-
3633
module_param_named_unsafe(force_execlist, xe_modparam.force_execlist, bool, 0444);
3734
MODULE_PARM_DESC(force_execlist, "Force Execlist submission");
3835

drivers/gpu/drm/xe/xe_module.h

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,6 @@
1212
struct xe_modparam {
1313
bool force_execlist;
1414
bool probe_display;
15-
bool always_migrate_to_vram;
1615
u32 force_vram_bar_size;
1716
int guc_log_level;
1817
char *guc_firmware_path;

drivers/gpu/drm/xe/xe_pt.c

Lines changed: 11 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2270,11 +2270,19 @@ static void op_commit(struct xe_vm *vm,
22702270
}
22712271
case DRM_GPUVA_OP_DRIVER:
22722272
{
2273+
/* WRITE_ONCE pairs with READ_ONCE in xe_svm.c */
2274+
22732275
if (op->subop == XE_VMA_SUBOP_MAP_RANGE) {
2274-
op->map_range.range->tile_present |= BIT(tile->id);
2275-
op->map_range.range->tile_invalidated &= ~BIT(tile->id);
2276+
WRITE_ONCE(op->map_range.range->tile_present,
2277+
op->map_range.range->tile_present |
2278+
BIT(tile->id));
2279+
WRITE_ONCE(op->map_range.range->tile_invalidated,
2280+
op->map_range.range->tile_invalidated &
2281+
~BIT(tile->id));
22762282
} else if (op->subop == XE_VMA_SUBOP_UNMAP_RANGE) {
2277-
op->unmap_range.range->tile_present &= ~BIT(tile->id);
2283+
WRITE_ONCE(op->unmap_range.range->tile_present,
2284+
op->unmap_range.range->tile_present &
2285+
~BIT(tile->id));
22782286
}
22792287
break;
22802288
}

drivers/gpu/drm/xe/xe_svm.c

Lines changed: 85 additions & 26 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,17 @@
1616

1717
static bool xe_svm_range_in_vram(struct xe_svm_range *range)
1818
{
19-
/* Not reliable without notifier lock */
20-
return range->base.flags.has_devmem_pages;
19+
/*
20+
* Advisory only check whether the range is currently backed by VRAM
21+
* memory.
22+
*/
23+
24+
struct drm_gpusvm_range_flags flags = {
25+
/* Pairs with WRITE_ONCE in drm_gpusvm.c */
26+
.__flags = READ_ONCE(range->base.flags.__flags),
27+
};
28+
29+
return flags.has_devmem_pages;
2130
}
2231

2332
static bool xe_svm_range_has_vram_binding(struct xe_svm_range *range)
@@ -650,9 +659,16 @@ void xe_svm_fini(struct xe_vm *vm)
650659
}
651660

652661
static bool xe_svm_range_is_valid(struct xe_svm_range *range,
653-
struct xe_tile *tile)
662+
struct xe_tile *tile,
663+
bool devmem_only)
654664
{
655-
return (range->tile_present & ~range->tile_invalidated) & BIT(tile->id);
665+
/*
666+
* Advisory only check whether the range currently has a valid mapping,
667+
* READ_ONCE pairs with WRITE_ONCE in xe_pt.c
668+
*/
669+
return ((READ_ONCE(range->tile_present) &
670+
~READ_ONCE(range->tile_invalidated)) & BIT(tile->id)) &&
671+
(!devmem_only || xe_svm_range_in_vram(range));
656672
}
657673

658674
#if IS_ENABLED(CONFIG_DRM_XE_DEVMEM_MIRROR)
@@ -726,6 +742,36 @@ static int xe_svm_alloc_vram(struct xe_vm *vm, struct xe_tile *tile,
726742
}
727743
#endif
728744

745+
static bool supports_4K_migration(struct xe_device *xe)
746+
{
747+
if (xe->info.vram_flags & XE_VRAM_FLAGS_NEED64K)
748+
return false;
749+
750+
return true;
751+
}
752+
753+
static bool xe_svm_range_needs_migrate_to_vram(struct xe_svm_range *range,
754+
struct xe_vma *vma)
755+
{
756+
struct xe_vm *vm = range_to_vm(&range->base);
757+
u64 range_size = xe_svm_range_size(range);
758+
759+
if (!range->base.flags.migrate_devmem)
760+
return false;
761+
762+
if (xe_svm_range_in_vram(range)) {
763+
drm_dbg(&vm->xe->drm, "Range is already in VRAM\n");
764+
return false;
765+
}
766+
767+
if (range_size <= SZ_64K && !supports_4K_migration(vm->xe)) {
768+
drm_dbg(&vm->xe->drm, "Platform doesn't support SZ_4K range migration\n");
769+
return false;
770+
}
771+
772+
return true;
773+
}
774+
729775
/**
730776
* xe_svm_handle_pagefault() - SVM handle page fault
731777
* @vm: The VM.
@@ -749,12 +795,15 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
749795
IS_ENABLED(CONFIG_DRM_XE_DEVMEM_MIRROR),
750796
.check_pages_threshold = IS_DGFX(vm->xe) &&
751797
IS_ENABLED(CONFIG_DRM_XE_DEVMEM_MIRROR) ? SZ_64K : 0,
798+
.devmem_only = atomic && IS_DGFX(vm->xe) &&
799+
IS_ENABLED(CONFIG_DRM_XE_DEVMEM_MIRROR),
752800
};
753801
struct xe_svm_range *range;
754802
struct drm_gpusvm_range *r;
755803
struct drm_exec exec;
756804
struct dma_fence *fence;
757805
struct xe_tile *tile = gt_to_tile(gt);
806+
int migrate_try_count = ctx.devmem_only ? 3 : 1;
758807
ktime_t end = 0;
759808
int err;
760809

@@ -775,40 +824,53 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
775824
if (IS_ERR(r))
776825
return PTR_ERR(r);
777826

827+
if (ctx.devmem_only && !r->flags.migrate_devmem)
828+
return -EACCES;
829+
778830
range = to_xe_range(r);
779-
if (xe_svm_range_is_valid(range, tile))
831+
if (xe_svm_range_is_valid(range, tile, ctx.devmem_only))
780832
return 0;
781833

782834
range_debug(range, "PAGE FAULT");
783835

784-
/* XXX: Add migration policy, for now migrate range once */
785-
if (!range->skip_migrate && range->base.flags.migrate_devmem &&
786-
xe_svm_range_size(range) >= SZ_64K) {
787-
range->skip_migrate = true;
788-
836+
if (--migrate_try_count >= 0 &&
837+
xe_svm_range_needs_migrate_to_vram(range, vma)) {
789838
err = xe_svm_alloc_vram(vm, tile, range, &ctx);
790839
if (err) {
791-
drm_dbg(&vm->xe->drm,
792-
"VRAM allocation failed, falling back to "
793-
"retrying fault, asid=%u, errno=%pe\n",
794-
vm->usm.asid, ERR_PTR(err));
795-
goto retry;
840+
if (migrate_try_count || !ctx.devmem_only) {
841+
drm_dbg(&vm->xe->drm,
842+
"VRAM allocation failed, falling back to retrying fault, asid=%u, errno=%pe\n",
843+
vm->usm.asid, ERR_PTR(err));
844+
goto retry;
845+
} else {
846+
drm_err(&vm->xe->drm,
847+
"VRAM allocation failed, retry count exceeded, asid=%u, errno=%pe\n",
848+
vm->usm.asid, ERR_PTR(err));
849+
return err;
850+
}
796851
}
797852
}
798853

799854
range_debug(range, "GET PAGES");
800855
err = drm_gpusvm_range_get_pages(&vm->svm.gpusvm, r, &ctx);
801856
/* Corner where CPU mappings have changed */
802857
if (err == -EOPNOTSUPP || err == -EFAULT || err == -EPERM) {
803-
if (err == -EOPNOTSUPP) {
804-
range_debug(range, "PAGE FAULT - EVICT PAGES");
805-
drm_gpusvm_range_evict(&vm->svm.gpusvm, &range->base);
858+
if (migrate_try_count > 0 || !ctx.devmem_only) {
859+
if (err == -EOPNOTSUPP) {
860+
range_debug(range, "PAGE FAULT - EVICT PAGES");
861+
drm_gpusvm_range_evict(&vm->svm.gpusvm,
862+
&range->base);
863+
}
864+
drm_dbg(&vm->xe->drm,
865+
"Get pages failed, falling back to retrying, asid=%u, gpusvm=%p, errno=%pe\n",
866+
vm->usm.asid, &vm->svm.gpusvm, ERR_PTR(err));
867+
range_debug(range, "PAGE FAULT - RETRY PAGES");
868+
goto retry;
869+
} else {
870+
drm_err(&vm->xe->drm,
871+
"Get pages failed, retry count exceeded, asid=%u, gpusvm=%p, errno=%pe\n",
872+
vm->usm.asid, &vm->svm.gpusvm, ERR_PTR(err));
806873
}
807-
drm_dbg(&vm->xe->drm,
808-
"Get pages failed, falling back to retrying, asid=%u, gpusvm=%p, errno=%pe\n",
809-
vm->usm.asid, &vm->svm.gpusvm, ERR_PTR(err));
810-
range_debug(range, "PAGE FAULT - RETRY PAGES");
811-
goto retry;
812874
}
813875
if (err) {
814876
range_debug(range, "PAGE FAULT - FAIL PAGE COLLECT");
@@ -842,9 +904,6 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
842904
}
843905
drm_exec_fini(&exec);
844906

845-
if (xe_modparam.always_migrate_to_vram)
846-
range->skip_migrate = false;
847-
848907
dma_fence_wait(fence, false);
849908
dma_fence_put(fence);
850909

drivers/gpu/drm/xe/xe_svm.h

Lines changed: 0 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -39,11 +39,6 @@ struct xe_svm_range {
3939
* range. Protected by GPU SVM notifier lock.
4040
*/
4141
u8 tile_invalidated;
42-
/**
43-
* @skip_migrate: Skip migration to VRAM, protected by GPU fault handler
44-
* locking.
45-
*/
46-
u8 skip_migrate :1;
4742
};
4843

4944
/**

include/drm/drm_gpusvm.h

Lines changed: 26 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -185,6 +185,31 @@ struct drm_gpusvm_notifier {
185185
} flags;
186186
};
187187

188+
/**
189+
* struct drm_gpusvm_range_flags - Structure representing a GPU SVM range flags
190+
*
191+
* @migrate_devmem: Flag indicating whether the range can be migrated to device memory
192+
* @unmapped: Flag indicating if the range has been unmapped
193+
* @partial_unmap: Flag indicating if the range has been partially unmapped
194+
* @has_devmem_pages: Flag indicating if the range has devmem pages
195+
* @has_dma_mapping: Flag indicating if the range has a DMA mapping
196+
* @__flags: Flags for range in u16 form (used for READ_ONCE)
197+
*/
198+
struct drm_gpusvm_range_flags {
199+
union {
200+
struct {
201+
/* All flags below must be set upon creation */
202+
u16 migrate_devmem : 1;
203+
/* All flags below must be set / cleared under notifier lock */
204+
u16 unmapped : 1;
205+
u16 partial_unmap : 1;
206+
u16 has_devmem_pages : 1;
207+
u16 has_dma_mapping : 1;
208+
};
209+
u16 __flags;
210+
};
211+
};
212+
188213
/**
189214
* struct drm_gpusvm_range - Structure representing a GPU SVM range
190215
*
@@ -198,11 +223,6 @@ struct drm_gpusvm_notifier {
198223
* @dpagemap: The struct drm_pagemap of the device pages we're dma-mapping.
199224
* Note this is assuming only one drm_pagemap per range is allowed.
200225
* @flags: Flags for range
201-
* @flags.migrate_devmem: Flag indicating whether the range can be migrated to device memory
202-
* @flags.unmapped: Flag indicating if the range has been unmapped
203-
* @flags.partial_unmap: Flag indicating if the range has been partially unmapped
204-
* @flags.has_devmem_pages: Flag indicating if the range has devmem pages
205-
* @flags.has_dma_mapping: Flag indicating if the range has a DMA mapping
206226
*
207227
* This structure represents a GPU SVM range used for tracking memory ranges
208228
* mapped in a DRM device.
@@ -216,15 +236,7 @@ struct drm_gpusvm_range {
216236
unsigned long notifier_seq;
217237
struct drm_pagemap_device_addr *dma_addr;
218238
struct drm_pagemap *dpagemap;
219-
struct {
220-
/* All flags below must be set upon creation */
221-
u16 migrate_devmem : 1;
222-
/* All flags below must be set / cleared under notifier lock */
223-
u16 unmapped : 1;
224-
u16 partial_unmap : 1;
225-
u16 has_devmem_pages : 1;
226-
u16 has_dma_mapping : 1;
227-
} flags;
239+
struct drm_gpusvm_range_flags flags;
228240
};
229241

230242
/**

0 commit comments

Comments
 (0)