drm/xe/migrate: Fix CCS copy for small VRAM copy chunks
[linux-2.6-microblaze.git] / drivers / gpu / drm / xe / tests / xe_migrate.c
1 // SPDX-License-Identifier: MIT
2 /*
3  * Copyright © 2020-2022 Intel Corporation
4  */
5
6 #include <kunit/test.h>
7 #include <kunit/visibility.h>
8
9 #include "tests/xe_migrate_test.h"
10 #include "tests/xe_pci_test.h"
11
12 #include "xe_pci.h"
13
14 static bool sanity_fence_failed(struct xe_device *xe, struct dma_fence *fence,
15                                 const char *str, struct kunit *test)
16 {
17         long ret;
18
19         if (IS_ERR(fence)) {
20                 KUNIT_FAIL(test, "Failed to create fence for %s: %li\n", str,
21                            PTR_ERR(fence));
22                 return true;
23         }
24         if (!fence)
25                 return true;
26
27         ret = dma_fence_wait_timeout(fence, false, 5 * HZ);
28         if (ret <= 0) {
29                 KUNIT_FAIL(test, "Fence timed out for %s: %li\n", str, ret);
30                 return true;
31         }
32
33         return false;
34 }
35
36 static int run_sanity_job(struct xe_migrate *m, struct xe_device *xe,
37                           struct xe_bb *bb, u32 second_idx, const char *str,
38                           struct kunit *test)
39 {
40         u64 batch_base = xe_migrate_batch_base(m, xe->info.has_usm);
41         struct xe_sched_job *job = xe_bb_create_migration_job(m->q, bb,
42                                                               batch_base,
43                                                               second_idx);
44         struct dma_fence *fence;
45
46         if (IS_ERR(job)) {
47                 KUNIT_FAIL(test, "Failed to allocate fake pt: %li\n",
48                            PTR_ERR(job));
49                 return PTR_ERR(job);
50         }
51
52         xe_sched_job_arm(job);
53         fence = dma_fence_get(&job->drm.s_fence->finished);
54         xe_sched_job_push(job);
55
56         if (sanity_fence_failed(xe, fence, str, test))
57                 return -ETIMEDOUT;
58
59         dma_fence_put(fence);
60         kunit_info(test, "%s: Job completed\n", str);
61         return 0;
62 }
63
64 static void
65 sanity_populate_cb(struct xe_migrate_pt_update *pt_update,
66                    struct xe_tile *tile, struct iosys_map *map, void *dst,
67                    u32 qword_ofs, u32 num_qwords,
68                    const struct xe_vm_pgtable_update *update)
69 {
70         struct migrate_test_params *p =
71                 to_migrate_test_params(xe_cur_kunit_priv(XE_TEST_LIVE_MIGRATE));
72         int i;
73         u64 *ptr = dst;
74         u64 value;
75
76         for (i = 0; i < num_qwords; i++) {
77                 value = (qword_ofs + i - update->ofs) * 0x1111111111111111ULL;
78                 if (map)
79                         xe_map_wr(tile_to_xe(tile), map, (qword_ofs + i) *
80                                   sizeof(u64), u64, value);
81                 else
82                         ptr[i] = value;
83         }
84
85         kunit_info(xe_cur_kunit(), "Used %s.\n", map ? "CPU" : "GPU");
86         if (p->force_gpu && map)
87                 KUNIT_FAIL(xe_cur_kunit(), "GPU pagetable update used CPU.\n");
88 }
89
90 static const struct xe_migrate_pt_update_ops sanity_ops = {
91         .populate = sanity_populate_cb,
92 };
93
94 #define check(_retval, _expected, str, _test)                           \
95         do { if ((_retval) != (_expected)) {                            \
96                         KUNIT_FAIL(_test, "Sanity check failed: " str   \
97                                    " expected %llx, got %llx\n",        \
98                                    (u64)(_expected), (u64)(_retval));   \
99                 } } while (0)
100
101 static void test_copy(struct xe_migrate *m, struct xe_bo *bo,
102                       struct kunit *test, u32 region)
103 {
104         struct xe_device *xe = tile_to_xe(m->tile);
105         u64 retval, expected = 0;
106         bool big = bo->size >= SZ_2M;
107         struct dma_fence *fence;
108         const char *str = big ? "Copying big bo" : "Copying small bo";
109         int err;
110
111         struct xe_bo *remote = xe_bo_create_locked(xe, m->tile, NULL,
112                                                    bo->size,
113                                                    ttm_bo_type_kernel,
114                                                    region |
115                                                    XE_BO_NEEDS_CPU_ACCESS);
116         if (IS_ERR(remote)) {
117                 KUNIT_FAIL(test, "Failed to allocate remote bo for %s: %li\n",
118                            str, PTR_ERR(remote));
119                 return;
120         }
121
122         err = xe_bo_validate(remote, NULL, false);
123         if (err) {
124                 KUNIT_FAIL(test, "Failed to validate system bo for %s: %li\n",
125                            str, err);
126                 goto out_unlock;
127         }
128
129         err = xe_bo_vmap(remote);
130         if (err) {
131                 KUNIT_FAIL(test, "Failed to vmap system bo for %s: %li\n",
132                            str, err);
133                 goto out_unlock;
134         }
135
136         xe_map_memset(xe, &remote->vmap, 0, 0xd0, remote->size);
137         fence = xe_migrate_clear(m, remote, remote->ttm.resource);
138         if (!sanity_fence_failed(xe, fence, big ? "Clearing remote big bo" :
139                                  "Clearing remote small bo", test)) {
140                 retval = xe_map_rd(xe, &remote->vmap, 0, u64);
141                 check(retval, expected, "remote first offset should be cleared",
142                       test);
143                 retval = xe_map_rd(xe, &remote->vmap, remote->size - 8, u64);
144                 check(retval, expected, "remote last offset should be cleared",
145                       test);
146         }
147         dma_fence_put(fence);
148
149         /* Try to copy 0xc0 from remote to vram with 2MB or 64KiB/4KiB pages */
150         xe_map_memset(xe, &remote->vmap, 0, 0xc0, remote->size);
151         xe_map_memset(xe, &bo->vmap, 0, 0xd0, bo->size);
152
153         expected = 0xc0c0c0c0c0c0c0c0;
154         fence = xe_migrate_copy(m, remote, bo, remote->ttm.resource,
155                                 bo->ttm.resource, false);
156         if (!sanity_fence_failed(xe, fence, big ? "Copying big bo remote -> vram" :
157                                  "Copying small bo remote -> vram", test)) {
158                 retval = xe_map_rd(xe, &bo->vmap, 0, u64);
159                 check(retval, expected,
160                       "remote -> vram bo first offset should be copied", test);
161                 retval = xe_map_rd(xe, &bo->vmap, bo->size - 8, u64);
162                 check(retval, expected,
163                       "remote -> vram bo offset should be copied", test);
164         }
165         dma_fence_put(fence);
166
167         /* And other way around.. slightly hacky.. */
168         xe_map_memset(xe, &remote->vmap, 0, 0xd0, remote->size);
169         xe_map_memset(xe, &bo->vmap, 0, 0xc0, bo->size);
170
171         fence = xe_migrate_copy(m, bo, remote, bo->ttm.resource,
172                                 remote->ttm.resource, false);
173         if (!sanity_fence_failed(xe, fence, big ? "Copying big bo vram -> remote" :
174                                  "Copying small bo vram -> remote", test)) {
175                 retval = xe_map_rd(xe, &remote->vmap, 0, u64);
176                 check(retval, expected,
177                       "vram -> remote bo first offset should be copied", test);
178                 retval = xe_map_rd(xe, &remote->vmap, bo->size - 8, u64);
179                 check(retval, expected,
180                       "vram -> remote bo last offset should be copied", test);
181         }
182         dma_fence_put(fence);
183
184         xe_bo_vunmap(remote);
185 out_unlock:
186         xe_bo_unlock(remote);
187         xe_bo_put(remote);
188 }
189
190 static void test_copy_sysmem(struct xe_migrate *m, struct xe_bo *bo,
191                              struct kunit *test)
192 {
193         test_copy(m, bo, test, XE_BO_CREATE_SYSTEM_BIT);
194 }
195
196 static void test_copy_vram(struct xe_migrate *m, struct xe_bo *bo,
197                            struct kunit *test)
198 {
199         u32 region;
200
201         if (bo->ttm.resource->mem_type == XE_PL_SYSTEM)
202                 return;
203
204         if (bo->ttm.resource->mem_type == XE_PL_VRAM0)
205                 region = XE_BO_CREATE_VRAM1_BIT;
206         else
207                 region = XE_BO_CREATE_VRAM0_BIT;
208         test_copy(m, bo, test, region);
209 }
210
211 static void test_pt_update(struct xe_migrate *m, struct xe_bo *pt,
212                            struct kunit *test, bool force_gpu)
213 {
214         struct xe_device *xe = tile_to_xe(m->tile);
215         struct dma_fence *fence;
216         u64 retval, expected;
217         ktime_t then, now;
218         int i;
219
220         struct xe_vm_pgtable_update update = {
221                 .ofs = 1,
222                 .qwords = 0x10,
223                 .pt_bo = pt,
224         };
225         struct xe_migrate_pt_update pt_update = {
226                 .ops = &sanity_ops,
227         };
228         struct migrate_test_params p = {
229                 .base.id = XE_TEST_LIVE_MIGRATE,
230                 .force_gpu = force_gpu,
231         };
232
233         test->priv = &p;
234         /* Test xe_migrate_update_pgtables() updates the pagetable as expected */
235         expected = 0xf0f0f0f0f0f0f0f0ULL;
236         xe_map_memset(xe, &pt->vmap, 0, (u8)expected, pt->size);
237
238         then = ktime_get();
239         fence = xe_migrate_update_pgtables(m, m->q->vm, NULL, m->q, &update, 1,
240                                            NULL, 0, &pt_update);
241         now = ktime_get();
242         if (sanity_fence_failed(xe, fence, "Migration pagetable update", test))
243                 return;
244
245         kunit_info(test, "Updating without syncing took %llu us,\n",
246                    (unsigned long long)ktime_to_us(ktime_sub(now, then)));
247
248         dma_fence_put(fence);
249         retval = xe_map_rd(xe, &pt->vmap, 0, u64);
250         check(retval, expected, "PTE[0] must stay untouched", test);
251
252         for (i = 0; i < update.qwords; i++) {
253                 retval = xe_map_rd(xe, &pt->vmap, (update.ofs + i) * 8, u64);
254                 check(retval, i * 0x1111111111111111ULL, "PTE update", test);
255         }
256
257         retval = xe_map_rd(xe, &pt->vmap, 8 * (update.ofs + update.qwords),
258                            u64);
259         check(retval, expected, "PTE[0x11] must stay untouched", test);
260 }
261
262 static void xe_migrate_sanity_test(struct xe_migrate *m, struct kunit *test)
263 {
264         struct xe_tile *tile = m->tile;
265         struct xe_device *xe = tile_to_xe(tile);
266         struct xe_bo *pt, *bo = m->pt_bo, *big, *tiny;
267         struct xe_res_cursor src_it;
268         struct dma_fence *fence;
269         u64 retval, expected;
270         struct xe_bb *bb;
271         int err;
272         u8 id = tile->id;
273
274         err = xe_bo_vmap(bo);
275         if (err) {
276                 KUNIT_FAIL(test, "Failed to vmap our pagetables: %li\n",
277                            PTR_ERR(bo));
278                 return;
279         }
280
281         big = xe_bo_create_pin_map(xe, tile, m->q->vm, SZ_4M,
282                                    ttm_bo_type_kernel,
283                                    XE_BO_CREATE_VRAM_IF_DGFX(tile) |
284                                    XE_BO_CREATE_PINNED_BIT);
285         if (IS_ERR(big)) {
286                 KUNIT_FAIL(test, "Failed to allocate bo: %li\n", PTR_ERR(big));
287                 goto vunmap;
288         }
289
290         pt = xe_bo_create_pin_map(xe, tile, m->q->vm, XE_PAGE_SIZE,
291                                   ttm_bo_type_kernel,
292                                   XE_BO_CREATE_VRAM_IF_DGFX(tile) |
293                                   XE_BO_CREATE_PINNED_BIT);
294         if (IS_ERR(pt)) {
295                 KUNIT_FAIL(test, "Failed to allocate fake pt: %li\n",
296                            PTR_ERR(pt));
297                 goto free_big;
298         }
299
300         tiny = xe_bo_create_pin_map(xe, tile, m->q->vm,
301                                     2 * SZ_4K,
302                                     ttm_bo_type_kernel,
303                                     XE_BO_CREATE_VRAM_IF_DGFX(tile) |
304                                     XE_BO_CREATE_PINNED_BIT);
305         if (IS_ERR(tiny)) {
306                 KUNIT_FAIL(test, "Failed to allocate fake pt: %li\n",
307                            PTR_ERR(pt));
308                 goto free_pt;
309         }
310
311         bb = xe_bb_new(tile->primary_gt, 32, xe->info.has_usm);
312         if (IS_ERR(bb)) {
313                 KUNIT_FAIL(test, "Failed to create batchbuffer: %li\n",
314                            PTR_ERR(bb));
315                 goto free_tiny;
316         }
317
318         kunit_info(test, "Starting tests, top level PT addr: %lx, special pagetable base addr: %lx\n",
319                    (unsigned long)xe_bo_main_addr(m->q->vm->pt_root[id]->bo, XE_PAGE_SIZE),
320                    (unsigned long)xe_bo_main_addr(m->pt_bo, XE_PAGE_SIZE));
321
322         /* First part of the test, are we updating our pagetable bo with a new entry? */
323         xe_map_wr(xe, &bo->vmap, XE_PAGE_SIZE * (NUM_KERNEL_PDE - 1), u64,
324                   0xdeaddeadbeefbeef);
325         expected = m->q->vm->pt_ops->pte_encode_bo(pt, 0, xe->pat.idx[XE_CACHE_WB], 0);
326         if (m->q->vm->flags & XE_VM_FLAG_64K)
327                 expected |= XE_PTE_PS64;
328         if (xe_bo_is_vram(pt))
329                 xe_res_first(pt->ttm.resource, 0, pt->size, &src_it);
330         else
331                 xe_res_first_sg(xe_bo_sg(pt), 0, pt->size, &src_it);
332
333         emit_pte(m, bb, NUM_KERNEL_PDE - 1, xe_bo_is_vram(pt), false,
334                  &src_it, XE_PAGE_SIZE, pt->ttm.resource);
335
336         run_sanity_job(m, xe, bb, bb->len, "Writing PTE for our fake PT", test);
337
338         retval = xe_map_rd(xe, &bo->vmap, XE_PAGE_SIZE * (NUM_KERNEL_PDE - 1),
339                            u64);
340         check(retval, expected, "PTE entry write", test);
341
342         /* Now try to write data to our newly mapped 'pagetable', see if it succeeds */
343         bb->len = 0;
344         bb->cs[bb->len++] = MI_BATCH_BUFFER_END;
345         xe_map_wr(xe, &pt->vmap, 0, u32, 0xdeaddead);
346         expected = 0;
347
348         emit_clear(tile->primary_gt, bb, xe_migrate_vm_addr(NUM_KERNEL_PDE - 1, 0), 4, 4,
349                    IS_DGFX(xe));
350         run_sanity_job(m, xe, bb, 1, "Writing to our newly mapped pagetable",
351                        test);
352
353         retval = xe_map_rd(xe, &pt->vmap, 0, u32);
354         check(retval, expected, "Write to PT after adding PTE", test);
355
356         /* Sanity checks passed, try the full ones! */
357
358         /* Clear a small bo */
359         kunit_info(test, "Clearing small buffer object\n");
360         xe_map_memset(xe, &tiny->vmap, 0, 0x22, tiny->size);
361         expected = 0;
362         fence = xe_migrate_clear(m, tiny, tiny->ttm.resource);
363         if (sanity_fence_failed(xe, fence, "Clearing small bo", test))
364                 goto out;
365
366         dma_fence_put(fence);
367         retval = xe_map_rd(xe, &tiny->vmap, 0, u32);
368         check(retval, expected, "Command clear small first value", test);
369         retval = xe_map_rd(xe, &tiny->vmap, tiny->size - 4, u32);
370         check(retval, expected, "Command clear small last value", test);
371
372         kunit_info(test, "Copying small buffer object to system\n");
373         test_copy_sysmem(m, tiny, test);
374         if (xe->info.tile_count > 1) {
375                 kunit_info(test, "Copying small buffer object to other vram\n");
376                 test_copy_vram(m, tiny, test);
377         }
378
379         /* Clear a big bo */
380         kunit_info(test, "Clearing big buffer object\n");
381         xe_map_memset(xe, &big->vmap, 0, 0x11, big->size);
382         expected = 0;
383         fence = xe_migrate_clear(m, big, big->ttm.resource);
384         if (sanity_fence_failed(xe, fence, "Clearing big bo", test))
385                 goto out;
386
387         dma_fence_put(fence);
388         retval = xe_map_rd(xe, &big->vmap, 0, u32);
389         check(retval, expected, "Command clear big first value", test);
390         retval = xe_map_rd(xe, &big->vmap, big->size - 4, u32);
391         check(retval, expected, "Command clear big last value", test);
392
393         kunit_info(test, "Copying big buffer object to system\n");
394         test_copy_sysmem(m, big, test);
395         if (xe->info.tile_count > 1) {
396                 kunit_info(test, "Copying big buffer object to other vram\n");
397                 test_copy_vram(m, big, test);
398         }
399
400         kunit_info(test, "Testing page table update using CPU if GPU idle.\n");
401         test_pt_update(m, pt, test, false);
402         kunit_info(test, "Testing page table update using GPU\n");
403         test_pt_update(m, pt, test, true);
404
405 out:
406         xe_bb_free(bb, NULL);
407 free_tiny:
408         xe_bo_unpin(tiny);
409         xe_bo_put(tiny);
410 free_pt:
411         xe_bo_unpin(pt);
412         xe_bo_put(pt);
413 free_big:
414         xe_bo_unpin(big);
415         xe_bo_put(big);
416 vunmap:
417         xe_bo_vunmap(m->pt_bo);
418 }
419
420 static int migrate_test_run_device(struct xe_device *xe)
421 {
422         struct kunit *test = xe_cur_kunit();
423         struct xe_tile *tile;
424         int id;
425
426         for_each_tile(tile, xe, id) {
427                 struct xe_migrate *m = tile->migrate;
428
429                 kunit_info(test, "Testing tile id %d.\n", id);
430                 xe_vm_lock(m->q->vm, true);
431                 xe_device_mem_access_get(xe);
432                 xe_migrate_sanity_test(m, test);
433                 xe_device_mem_access_put(xe);
434                 xe_vm_unlock(m->q->vm);
435         }
436
437         return 0;
438 }
439
440 void xe_migrate_sanity_kunit(struct kunit *test)
441 {
442         xe_call_for_each_device(migrate_test_run_device);
443 }
444 EXPORT_SYMBOL_IF_KUNIT(xe_migrate_sanity_kunit);