// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (C) 2024, Advanced Micro Devices, Inc.
 */

#include <drm/amdxdna_accel.h>
#include <drm/drm_cache.h>
#include <drm/drm_device.h>
#include <drm/drm_gem.h>
#include <drm/drm_gem_shmem_helper.h>
#include <drm/gpu_scheduler.h>
#include <linux/dma-buf.h>
#include <linux/dma-direct.h>
#include <linux/iosys-map.h>
#include <linux/pagemap.h>
#include <linux/vmalloc.h>

#include "amdxdna_ctx.h"
#include "amdxdna_gem.h"
#include "amdxdna_pci_drv.h"

#define XDNA_MAX_CMD_BO_SIZE	SZ_32K

MODULE_IMPORT_NS("DMA_BUF");

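/*
 * Carve a dev BO out of the client's device heap with drm_mm. On success,
 * the BO's device address, user VA, and kernel VA are all derived from its
 * offset within the heap, and a reference is taken on the heap object so
 * the heap outlives the carve-out.
 */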
static int
amdxdna_gem_heap_alloc(struct amdxdna_gem_obj *abo)
{
	struct amdxdna_client *client = abo->client;
	struct amdxdna_dev *xdna = client->xdna;
	struct amdxdna_mem *mem = &abo->mem;
	struct amdxdna_gem_obj *heap;
	u64 offset;
	u32 align;
	int ret;

	mutex_lock(&client->mm_lock);

	heap = client->dev_heap;
	if (!heap) {
		ret = -EINVAL;
		goto unlock_out;
	}

	if (heap->mem.userptr == AMDXDNA_INVALID_ADDR) {
		XDNA_ERR(xdna, "Invalid dev heap userptr");
		ret = -EINVAL;
		goto unlock_out;
	}

	if (mem->size == 0 || mem->size > heap->mem.size) {
		XDNA_ERR(xdna, "Invalid dev bo size 0x%lx, limit 0x%lx",
			 mem->size, heap->mem.size);
		ret = -EINVAL;
		goto unlock_out;
	}

	align = 1 << max(PAGE_SHIFT, xdna->dev_info->dev_mem_buf_shift);
	ret = drm_mm_insert_node_generic(&heap->mm, &abo->mm_node,
					 mem->size, align,
					 0, DRM_MM_INSERT_BEST);
	if (ret) {
		XDNA_ERR(xdna, "Failed to alloc dev bo memory, ret %d", ret);
		goto unlock_out;
	}

	mem->dev_addr = abo->mm_node.start;
	offset = mem->dev_addr - heap->mem.dev_addr;
	mem->userptr = heap->mem.userptr + offset;
	mem->kva = heap->mem.kva + offset;

	drm_gem_object_get(to_gobj(heap));

unlock_out:
	mutex_unlock(&client->mm_lock);

	return ret;
}

static void
amdxdna_gem_destroy_obj(struct amdxdna_gem_obj *abo)
{
	mutex_destroy(&abo->lock);
	kfree(abo);
}

static void
amdxdna_gem_heap_free(struct amdxdna_gem_obj *abo)
{
	struct amdxdna_gem_obj *heap;

	mutex_lock(&abo->client->mm_lock);

	drm_mm_remove_node(&abo->mm_node);

	heap = abo->client->dev_heap;
	drm_gem_object_put(to_gobj(heap));

	mutex_unlock(&abo->client->mm_lock);
}

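/*
 * MMU interval notifier callback. Mark the mapping invalid, advance the
 * notifier sequence, and tell the device layer to stop using the range.
 * On an unmap event the notifier removal is deferred to a workqueue,
 * since it cannot be done from inside the callback itself.
 */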
static bool amdxdna_hmm_invalidate(struct mmu_interval_notifier *mni,
				   const struct mmu_notifier_range *range,
				   unsigned long cur_seq)
{
	struct amdxdna_umap *mapp = container_of(mni, struct amdxdna_umap, notifier);
	struct amdxdna_gem_obj *abo = mapp->abo;
	struct amdxdna_dev *xdna;

	xdna = to_xdna_dev(to_gobj(abo)->dev);
	XDNA_DBG(xdna, "Invalidating range 0x%lx, 0x%lx, type %d",
		 mapp->vma->vm_start, mapp->vma->vm_end, abo->type);

	if (!mmu_notifier_range_blockable(range))
		return false;

	down_write(&xdna->notifier_lock);
	abo->mem.map_invalid = true;
	mapp->invalid = true;
	mmu_interval_set_seq(&mapp->notifier, cur_seq);
	up_write(&xdna->notifier_lock);

	xdna->dev_info->ops->hmm_invalidate(abo, cur_seq);

	if (range->event == MMU_NOTIFY_UNMAP) {
		down_write(&xdna->notifier_lock);
		if (!mapp->unmapped) {
			queue_work(xdna->notifier_wq, &mapp->hmm_unreg_work);
			mapp->unmapped = true;
		}
		up_write(&xdna->notifier_lock);
	}

	return true;
}

static const struct mmu_interval_notifier_ops amdxdna_hmm_ops = {
	.invalidate = amdxdna_hmm_invalidate,
};

static void amdxdna_hmm_unregister(struct amdxdna_gem_obj *abo,
				   struct vm_area_struct *vma)
{
	struct amdxdna_dev *xdna = to_xdna_dev(to_gobj(abo)->dev);
	struct amdxdna_umap *mapp;

	down_read(&xdna->notifier_lock);
	list_for_each_entry(mapp, &abo->mem.umap_list, node) {
		if (!vma || mapp->vma == vma) {
			if (!mapp->unmapped) {
				queue_work(xdna->notifier_wq, &mapp->hmm_unreg_work);
				mapp->unmapped = true;
			}
			if (vma)
				break;
		}
	}
	up_read(&xdna->notifier_lock);
}

static void amdxdna_umap_release(struct kref *ref)
{
	struct amdxdna_umap *mapp = container_of(ref, struct amdxdna_umap, refcnt);
	struct vm_area_struct *vma = mapp->vma;
	struct amdxdna_dev *xdna;

	mmu_interval_notifier_remove(&mapp->notifier);
	if (is_import_bo(mapp->abo) && vma->vm_file && vma->vm_file->f_mapping)
		mapping_clear_unevictable(vma->vm_file->f_mapping);

	xdna = to_xdna_dev(to_gobj(mapp->abo)->dev);
	down_write(&xdna->notifier_lock);
	list_del(&mapp->node);
	up_write(&xdna->notifier_lock);

	kvfree(mapp->range.hmm_pfns);
	kfree(mapp);
}

void amdxdna_umap_put(struct amdxdna_umap *mapp)
{
	kref_put(&mapp->refcnt, amdxdna_umap_release);
}

static void amdxdna_hmm_unreg_work(struct work_struct *work)
{
	struct amdxdna_umap *mapp = container_of(work, struct amdxdna_umap,
						 hmm_unreg_work);

	amdxdna_umap_put(mapp);
}

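/*
 * Track a userspace mapping of the BO. Allocate an amdxdna_umap, size its
 * pfn array to the VMA, and insert an MMU interval notifier covering the
 * range so CPU-side changes to the mapping invalidate the device's view.
 * A no-op on devices that do not implement hmm_invalidate.
 */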
static int amdxdna_hmm_register(struct amdxdna_gem_obj *abo,
				struct vm_area_struct *vma)
{
	struct amdxdna_dev *xdna = to_xdna_dev(to_gobj(abo)->dev);
	unsigned long len = vma->vm_end - vma->vm_start;
	unsigned long addr = vma->vm_start;
	struct amdxdna_umap *mapp;
	u32 nr_pages;
	int ret;

	if (!xdna->dev_info->ops->hmm_invalidate)
		return 0;

	mapp = kzalloc(sizeof(*mapp), GFP_KERNEL);
	if (!mapp)
		return -ENOMEM;

	nr_pages = (PAGE_ALIGN(addr + len) - (addr & PAGE_MASK)) >> PAGE_SHIFT;
	mapp->range.hmm_pfns = kvcalloc(nr_pages, sizeof(*mapp->range.hmm_pfns),
					GFP_KERNEL);
	if (!mapp->range.hmm_pfns) {
		ret = -ENOMEM;
		goto free_map;
	}

	ret = mmu_interval_notifier_insert_locked(&mapp->notifier,
						  current->mm,
						  addr,
						  len,
						  &amdxdna_hmm_ops);
	if (ret) {
		XDNA_ERR(xdna, "Insert mmu notifier failed, ret %d", ret);
		goto free_pfns;
	}

	mapp->range.notifier = &mapp->notifier;
	mapp->range.start = vma->vm_start;
	mapp->range.end = vma->vm_end;
	mapp->range.default_flags = HMM_PFN_REQ_FAULT;
	mapp->vma = vma;
	mapp->abo = abo;
	kref_init(&mapp->refcnt);

	if (abo->mem.userptr == AMDXDNA_INVALID_ADDR)
		abo->mem.userptr = addr;
	INIT_WORK(&mapp->hmm_unreg_work, amdxdna_hmm_unreg_work);
	if (is_import_bo(abo) && vma->vm_file && vma->vm_file->f_mapping)
		mapping_set_unevictable(vma->vm_file->f_mapping);

	down_write(&xdna->notifier_lock);
	list_add_tail(&mapp->node, &abo->mem.umap_list);
	up_write(&xdna->notifier_lock);

	return 0;

free_pfns:
	kvfree(mapp->range.hmm_pfns);
free_map:
	kfree(mapp);
	return ret;
}

static void amdxdna_gem_dev_obj_free(struct drm_gem_object *gobj)
{
	struct amdxdna_dev *xdna = to_xdna_dev(gobj->dev);
	struct amdxdna_gem_obj *abo = to_xdna_obj(gobj);

	XDNA_DBG(xdna, "BO type %d xdna_addr 0x%llx", abo->type, abo->mem.dev_addr);
	if (abo->pinned)
		amdxdna_gem_unpin(abo);

	amdxdna_gem_heap_free(abo);
	drm_gem_object_release(gobj);
	amdxdna_gem_destroy_obj(abo);
}

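/*
 * Populate the PTEs of a mapping up front rather than faulting on demand.
 * Native shmem BOs mmap through the shmem helper and then insert all
 * backing pages directly; imported dma-bufs delegate to dma_buf_mmap()
 * and fault each page in by hand, since the exporter owns the pages.
 */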
static int amdxdna_insert_pages(struct amdxdna_gem_obj *abo,
				struct vm_area_struct *vma)
{
	struct amdxdna_dev *xdna = to_xdna_dev(to_gobj(abo)->dev);
	unsigned long num_pages = vma_pages(vma);
	unsigned long offset = 0;
	int ret;

	if (!is_import_bo(abo)) {
		ret = drm_gem_shmem_mmap(&abo->base, vma);
		if (ret) {
			XDNA_ERR(xdna, "Failed shmem mmap %d", ret);
			return ret;
		}

		/* The buffer is backed by memory pages. Fix up the VMA flags. */
		vm_flags_mod(vma, VM_MIXEDMAP, VM_PFNMAP);
		ret = vm_insert_pages(vma, vma->vm_start, abo->base.pages,
				      &num_pages);
		if (ret) {
			XDNA_ERR(xdna, "Failed insert pages %d", ret);
			vma->vm_ops->close(vma);
			return ret;
		}

		return 0;
	}

	vma->vm_private_data = NULL;
	vma->vm_ops = NULL;
	ret = dma_buf_mmap(to_gobj(abo)->dma_buf, vma, 0);
	if (ret) {
		XDNA_ERR(xdna, "Failed to mmap dma buf %d", ret);
		return ret;
	}

	do {
		vm_fault_t fault_ret;

		fault_ret = handle_mm_fault(vma, vma->vm_start + offset,
					    FAULT_FLAG_WRITE, NULL);
		if (fault_ret & VM_FAULT_ERROR) {
			vma->vm_ops->close(vma);
			XDNA_ERR(xdna, "Fault in page failed");
			return -EFAULT;
		}

		offset += PAGE_SIZE;
	} while (--num_pages);

	/* Drop the reference drm_gem_mmap_obj() acquired. */
	drm_gem_object_put(to_gobj(abo));

	return 0;
}

static int amdxdna_gem_obj_mmap(struct drm_gem_object *gobj,
				struct vm_area_struct *vma)
{
	struct amdxdna_dev *xdna = to_xdna_dev(gobj->dev);
	struct amdxdna_gem_obj *abo = to_xdna_obj(gobj);
	int ret;

	ret = amdxdna_hmm_register(abo, vma);
	if (ret)
		return ret;

	ret = amdxdna_insert_pages(abo, vma);
	if (ret) {
		XDNA_ERR(xdna, "Failed insert pages, ret %d", ret);
		goto hmm_unreg;
	}

	XDNA_DBG(xdna, "BO map_offset 0x%llx type %d userptr 0x%lx size 0x%lx",
		 drm_vma_node_offset_addr(&gobj->vma_node), abo->type,
		 vma->vm_start, gobj->size);
	return 0;

hmm_unreg:
	amdxdna_hmm_unregister(abo, vma);
	return ret;
}

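/*
 * mmap callback for BOs this driver exports as dma-bufs. Reuses the shmem
 * helper vm_ops and pre-inserts all backing pages, mirroring the native
 * mmap path above.
 */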
static int amdxdna_gem_dmabuf_mmap(struct dma_buf *dma_buf, struct vm_area_struct *vma)
{
	struct drm_gem_object *gobj = dma_buf->priv;
	struct amdxdna_gem_obj *abo = to_xdna_obj(gobj);
	unsigned long num_pages = vma_pages(vma);
	int ret;

	vma->vm_ops = &drm_gem_shmem_vm_ops;
	vma->vm_private_data = gobj;

	drm_gem_object_get(gobj);
	ret = drm_gem_shmem_mmap(&abo->base, vma);
	if (ret)
		goto put_obj;

	/* The buffer is backed by memory pages. Fix up the VMA flags. */
	vm_flags_mod(vma, VM_MIXEDMAP, VM_PFNMAP);
	ret = vm_insert_pages(vma, vma->vm_start, abo->base.pages,
			      &num_pages);
	if (ret)
		goto close_vma;

	return 0;

close_vma:
	vma->vm_ops->close(vma);
put_obj:
	drm_gem_object_put(gobj);
	return ret;
}

static const struct dma_buf_ops amdxdna_dmabuf_ops = {
	.attach = drm_gem_map_attach,
	.detach = drm_gem_map_detach,
	.map_dma_buf = drm_gem_map_dma_buf,
	.unmap_dma_buf = drm_gem_unmap_dma_buf,
	.release = drm_gem_dmabuf_release,
	.mmap = amdxdna_gem_dmabuf_mmap,
	.vmap = drm_gem_dmabuf_vmap,
	.vunmap = drm_gem_dmabuf_vunmap,
};

static struct dma_buf *amdxdna_gem_prime_export(struct drm_gem_object *gobj, int flags)
{
	DEFINE_DMA_BUF_EXPORT_INFO(exp_info);

	exp_info.ops = &amdxdna_dmabuf_ops;
	exp_info.size = gobj->size;
	exp_info.flags = flags;
	exp_info.priv = gobj;
	exp_info.resv = gobj->resv;

	return drm_gem_dmabuf_export(gobj->dev, &exp_info);
}

static void amdxdna_imported_obj_free(struct amdxdna_gem_obj *abo)
{
	dma_buf_unmap_attachment_unlocked(abo->attach, abo->base.sgt, DMA_BIDIRECTIONAL);
	dma_buf_detach(abo->dma_buf, abo->attach);
	dma_buf_put(abo->dma_buf);
	drm_gem_object_release(to_gobj(abo));
	kfree(abo);
}

static void amdxdna_gem_obj_free(struct drm_gem_object *gobj)
{
	struct amdxdna_dev *xdna = to_xdna_dev(gobj->dev);
	struct amdxdna_gem_obj *abo = to_xdna_obj(gobj);
	struct iosys_map map = IOSYS_MAP_INIT_VADDR(abo->mem.kva);

	XDNA_DBG(xdna, "BO type %d xdna_addr 0x%llx", abo->type, abo->mem.dev_addr);

	amdxdna_hmm_unregister(abo, NULL);
	flush_workqueue(xdna->notifier_wq);

	if (abo->pinned)
		amdxdna_gem_unpin(abo);

	if (abo->type == AMDXDNA_BO_DEV_HEAP)
		drm_mm_takedown(&abo->mm);

	drm_gem_vunmap(gobj, &map);
	mutex_destroy(&abo->lock);

	if (is_import_bo(abo)) {
		amdxdna_imported_obj_free(abo);
		return;
	}

	drm_gem_shmem_free(&abo->base);
}

static const struct drm_gem_object_funcs amdxdna_gem_dev_obj_funcs = {
	.free = amdxdna_gem_dev_obj_free,
};

static const struct drm_gem_object_funcs amdxdna_gem_shmem_funcs = {
	.free = amdxdna_gem_obj_free,
	.print_info = drm_gem_shmem_object_print_info,
	.pin = drm_gem_shmem_object_pin,
	.unpin = drm_gem_shmem_object_unpin,
	.get_sg_table = drm_gem_shmem_object_get_sg_table,
	.vmap = drm_gem_shmem_object_vmap,
	.vunmap = drm_gem_shmem_object_vunmap,
	.mmap = amdxdna_gem_obj_mmap,
	.vm_ops = &drm_gem_shmem_vm_ops,
	.export = amdxdna_gem_prime_export,
};

static struct amdxdna_gem_obj *
amdxdna_gem_create_obj(struct drm_device *dev, size_t size)
{
	struct amdxdna_gem_obj *abo;

	abo = kzalloc(sizeof(*abo), GFP_KERNEL);
	if (!abo)
		return ERR_PTR(-ENOMEM);

	abo->pinned = false;
	abo->assigned_hwctx = AMDXDNA_INVALID_CTX_HANDLE;
	mutex_init(&abo->lock);

	abo->mem.userptr = AMDXDNA_INVALID_ADDR;
	abo->mem.dev_addr = AMDXDNA_INVALID_ADDR;
	abo->mem.size = size;
	INIT_LIST_HEAD(&abo->mem.umap_list);

	return abo;
}

/* For drm_driver->gem_create_object callback */
struct drm_gem_object *
amdxdna_gem_create_object_cb(struct drm_device *dev, size_t size)
{
	struct amdxdna_gem_obj *abo;

	abo = amdxdna_gem_create_obj(dev, size);
	if (IS_ERR(abo))
		return ERR_CAST(abo);

	to_gobj(abo)->funcs = &amdxdna_gem_shmem_funcs;

	return to_gobj(abo);
}

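/*
 * Import a dma-buf as a shmem GEM object. The attachment and sg table are
 * mapped up front and stay mapped for the object's whole lifetime; the
 * references taken here are dropped in amdxdna_imported_obj_free().
 */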
struct drm_gem_object *
amdxdna_gem_prime_import(struct drm_device *dev, struct dma_buf *dma_buf)
{
	struct dma_buf_attachment *attach;
	struct amdxdna_gem_obj *abo;
	struct drm_gem_object *gobj;
	struct sg_table *sgt;
	int ret;

	get_dma_buf(dma_buf);

	attach = dma_buf_attach(dma_buf, dev->dev);
	if (IS_ERR(attach)) {
		ret = PTR_ERR(attach);
		goto put_buf;
	}

	sgt = dma_buf_map_attachment_unlocked(attach, DMA_BIDIRECTIONAL);
	if (IS_ERR(sgt)) {
		ret = PTR_ERR(sgt);
		goto fail_detach;
	}

	gobj = drm_gem_shmem_prime_import_sg_table(dev, attach, sgt);
	if (IS_ERR(gobj)) {
		ret = PTR_ERR(gobj);
		goto fail_unmap;
	}

	abo = to_xdna_obj(gobj);
	abo->attach = attach;
	abo->dma_buf = dma_buf;

	return gobj;

fail_unmap:
	dma_buf_unmap_attachment_unlocked(attach, sgt, DMA_BIDIRECTIONAL);
fail_detach:
	dma_buf_detach(dma_buf, attach);
put_buf:
	dma_buf_put(dma_buf);

	return ERR_PTR(ret);
}

static struct amdxdna_gem_obj *
amdxdna_drm_alloc_shmem(struct drm_device *dev,
			struct amdxdna_drm_create_bo *args,
			struct drm_file *filp)
{
	struct amdxdna_client *client = filp->driver_priv;
	struct drm_gem_shmem_object *shmem;
	struct amdxdna_gem_obj *abo;

	shmem = drm_gem_shmem_create(dev, args->size);
	if (IS_ERR(shmem))
		return ERR_CAST(shmem);

	shmem->map_wc = false;

	abo = to_xdna_obj(&shmem->base);
	abo->client = client;
	abo->type = AMDXDNA_BO_SHMEM;

	return abo;
}

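/*
 * Create the per-client device heap: a shmem BO whose device address is
 * the fixed device memory base, vmapped for CPU access, with a drm_mm
 * manager from which later AMDXDNA_BO_DEV allocations are carved. Each
 * client may have at most one heap.
 */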
static struct amdxdna_gem_obj *
amdxdna_drm_create_dev_heap(struct drm_device *dev,
			    struct amdxdna_drm_create_bo *args,
			    struct drm_file *filp)
{
	struct amdxdna_client *client = filp->driver_priv;
	struct iosys_map map = IOSYS_MAP_INIT_VADDR(NULL);
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	struct drm_gem_shmem_object *shmem;
	struct amdxdna_gem_obj *abo;
	int ret;

	if (args->size > xdna->dev_info->dev_mem_size) {
		XDNA_DBG(xdna, "Invalid dev heap size 0x%llx, limit 0x%lx",
			 args->size, xdna->dev_info->dev_mem_size);
		return ERR_PTR(-EINVAL);
	}

	mutex_lock(&client->mm_lock);
	if (client->dev_heap) {
		XDNA_DBG(client->xdna, "dev heap is already created");
		ret = -EBUSY;
		goto mm_unlock;
	}

	shmem = drm_gem_shmem_create(dev, args->size);
	if (IS_ERR(shmem)) {
		ret = PTR_ERR(shmem);
		goto mm_unlock;
	}

	shmem->map_wc = false;
	abo = to_xdna_obj(&shmem->base);
	abo->type = AMDXDNA_BO_DEV_HEAP;
	abo->client = client;
	abo->mem.dev_addr = client->xdna->dev_info->dev_mem_base;
	drm_mm_init(&abo->mm, abo->mem.dev_addr, abo->mem.size);

	ret = drm_gem_vmap(to_gobj(abo), &map);
	if (ret) {
		XDNA_ERR(xdna, "Vmap heap bo failed, ret %d", ret);
		goto release_obj;
	}
	abo->mem.kva = map.vaddr;

	client->dev_heap = abo;
	drm_gem_object_get(to_gobj(abo));
	mutex_unlock(&client->mm_lock);

	return abo;

release_obj:
	drm_gem_object_put(to_gobj(abo));
mm_unlock:
	mutex_unlock(&client->mm_lock);
	return ERR_PTR(ret);
}

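/*
 * Allocate an AMDXDNA_BO_DEV object. These BOs carry no backing storage
 * of their own; they are sub-allocated from the client's device heap, so
 * the GEM object is initialized as a private (pageless) object.
 */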
struct amdxdna_gem_obj *
amdxdna_drm_alloc_dev_bo(struct drm_device *dev,
			 struct amdxdna_drm_create_bo *args,
			 struct drm_file *filp)
{
	struct amdxdna_client *client = filp->driver_priv;
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	size_t aligned_sz = PAGE_ALIGN(args->size);
	struct amdxdna_gem_obj *abo;
	int ret;

	abo = amdxdna_gem_create_obj(&xdna->ddev, aligned_sz);
	if (IS_ERR(abo))
		return abo;

	to_gobj(abo)->funcs = &amdxdna_gem_dev_obj_funcs;
	abo->type = AMDXDNA_BO_DEV;
	abo->client = client;

	ret = amdxdna_gem_heap_alloc(abo);
	if (ret) {
		XDNA_ERR(xdna, "Failed to alloc dev bo memory, ret %d", ret);
		amdxdna_gem_destroy_obj(abo);
		return ERR_PTR(ret);
	}

	drm_gem_private_object_init(&xdna->ddev, to_gobj(abo), aligned_sz);

	return abo;
}

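/*
 * Create a command BO. Command buffers are bounded in size (at most
 * XDNA_MAX_CMD_BO_SIZE, at least sizeof(struct amdxdna_cmd)) and are kept
 * vmapped so the driver has CPU access to their contents.
 */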
static struct amdxdna_gem_obj *
amdxdna_drm_create_cmd_bo(struct drm_device *dev,
			  struct amdxdna_drm_create_bo *args,
			  struct drm_file *filp)
{
	struct iosys_map map = IOSYS_MAP_INIT_VADDR(NULL);
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	struct drm_gem_shmem_object *shmem;
	struct amdxdna_gem_obj *abo;
	int ret;

	if (args->size > XDNA_MAX_CMD_BO_SIZE) {
		XDNA_ERR(xdna, "Command bo size 0x%llx too large", args->size);
		return ERR_PTR(-EINVAL);
	}

	if (args->size < sizeof(struct amdxdna_cmd)) {
		XDNA_DBG(xdna, "Command BO size 0x%llx too small", args->size);
		return ERR_PTR(-EINVAL);
	}

	shmem = drm_gem_shmem_create(dev, args->size);
	if (IS_ERR(shmem))
		return ERR_CAST(shmem);

	shmem->map_wc = false;
	abo = to_xdna_obj(&shmem->base);

	abo->type = AMDXDNA_BO_CMD;
	abo->client = filp->driver_priv;

	ret = drm_gem_vmap(to_gobj(abo), &map);
	if (ret) {
		XDNA_ERR(xdna, "Vmap cmd bo failed, ret %d", ret);
		goto release_obj;
	}
	abo->mem.kva = map.vaddr;

	return abo;

release_obj:
	drm_gem_shmem_free(shmem);
	return ERR_PTR(ret);
}

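/*
 * Create BO ioctl: dispatch on args->type, then publish the new object to
 * userspace via a GEM handle. The handle holds the long-lived reference;
 * the local reference is dropped before returning.
 */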
int amdxdna_drm_create_bo_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)
{
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	struct amdxdna_drm_create_bo *args = data;
	struct amdxdna_gem_obj *abo;
	int ret;

	if (args->flags || args->vaddr || !args->size)
		return -EINVAL;

	XDNA_DBG(xdna, "BO arg type %d vaddr 0x%llx size 0x%llx flags 0x%llx",
		 args->type, args->vaddr, args->size, args->flags);
	switch (args->type) {
	case AMDXDNA_BO_SHMEM:
		abo = amdxdna_drm_alloc_shmem(dev, args, filp);
		break;
	case AMDXDNA_BO_DEV_HEAP:
		abo = amdxdna_drm_create_dev_heap(dev, args, filp);
		break;
	case AMDXDNA_BO_DEV:
		abo = amdxdna_drm_alloc_dev_bo(dev, args, filp);
		break;
	case AMDXDNA_BO_CMD:
		abo = amdxdna_drm_create_cmd_bo(dev, args, filp);
		break;
	default:
		return -EINVAL;
	}
	if (IS_ERR(abo))
		return PTR_ERR(abo);

	/* ready to publish object to userspace */
	ret = drm_gem_handle_create(filp, to_gobj(abo), &args->handle);
	if (ret) {
		XDNA_ERR(xdna, "Create handle failed");
		goto put_obj;
	}

	XDNA_DBG(xdna, "BO hdl %d type %d userptr 0x%llx xdna_addr 0x%llx size 0x%lx",
		 args->handle, args->type, abo->mem.userptr,
		 abo->mem.dev_addr, abo->mem.size);
put_obj:
	/* Drop the local reference; the handle holds one now. */
	drm_gem_object_put(to_gobj(abo));
	return ret;
}

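/*
 * Pin the pages backing a BO. AMDXDNA_BO_DEV objects are backed by their
 * client's heap, so the heap BO is pinned in their place. Imported BOs
 * need no explicit pin here; their backing is held via the dma-buf
 * attachment.
 */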
int amdxdna_gem_pin_nolock(struct amdxdna_gem_obj *abo)
{
	struct amdxdna_dev *xdna = to_xdna_dev(to_gobj(abo)->dev);
	int ret;

	if (abo->type == AMDXDNA_BO_DEV)
		abo = abo->client->dev_heap;

	if (is_import_bo(abo))
		return 0;

	ret = drm_gem_shmem_pin(&abo->base);

	XDNA_DBG(xdna, "BO type %d ret %d", abo->type, ret);
	return ret;
}

int amdxdna_gem_pin(struct amdxdna_gem_obj *abo)
{
	int ret;

	mutex_lock(&abo->lock);
	ret = amdxdna_gem_pin_nolock(abo);
	mutex_unlock(&abo->lock);

	return ret;
}

void amdxdna_gem_unpin(struct amdxdna_gem_obj *abo)
{
	if (abo->type == AMDXDNA_BO_DEV)
		abo = abo->client->dev_heap;

	if (is_import_bo(abo))
		return;

	mutex_lock(&abo->lock);
	drm_gem_shmem_unpin(&abo->base);
	mutex_unlock(&abo->lock);
}

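/*
 * Look up a BO by handle, optionally checking its type. Returns the BO
 * with a reference held on success; the caller must drop it with
 * drm_gem_object_put(). Pass AMDXDNA_BO_INVALID to skip the type check.
 */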
struct amdxdna_gem_obj *amdxdna_gem_get_obj(struct amdxdna_client *client,
					    u32 bo_hdl, u8 bo_type)
{
	struct amdxdna_dev *xdna = client->xdna;
	struct amdxdna_gem_obj *abo;
	struct drm_gem_object *gobj;

	gobj = drm_gem_object_lookup(client->filp, bo_hdl);
	if (!gobj) {
		XDNA_DBG(xdna, "Can not find bo %d", bo_hdl);
		return NULL;
	}

	abo = to_xdna_obj(gobj);
	if (bo_type == AMDXDNA_BO_INVALID || abo->type == bo_type)
		return abo;

	drm_gem_object_put(gobj);
	return NULL;
}

int amdxdna_drm_get_bo_info_ioctl(struct drm_device *dev, void *data, struct drm_file *filp)
{
	struct amdxdna_drm_get_bo_info *args = data;
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	struct amdxdna_gem_obj *abo;
	struct drm_gem_object *gobj;
	int ret = 0;

	if (args->ext || args->ext_flags || args->pad)
		return -EINVAL;

	gobj = drm_gem_object_lookup(filp, args->handle);
	if (!gobj) {
		XDNA_DBG(xdna, "Lookup GEM object %d failed", args->handle);
		return -ENOENT;
	}

	abo = to_xdna_obj(gobj);
	args->vaddr = abo->mem.userptr;
	args->xdna_addr = abo->mem.dev_addr;

	if (abo->type != AMDXDNA_BO_DEV)
		args->map_offset = drm_vma_node_offset_addr(&gobj->vma_node);
	else
		args->map_offset = AMDXDNA_INVALID_ADDR;

	XDNA_DBG(xdna, "BO hdl %d map_offset 0x%llx vaddr 0x%llx xdna_addr 0x%llx",
		 args->handle, args->map_offset, args->vaddr, args->xdna_addr);

	drm_gem_object_put(gobj);
	return ret;
}

/*
 * The sync BO ioctl keeps the CPU cache in sync with memory. This is
 * required because the NPU is not a cache-coherent device. CPU cache
 * flushing/invalidation is expensive, so it is best handled outside the
 * command submission path; this ioctl lets userspace flush/invalidate
 * explicitly, away from that critical path.
 */
int amdxdna_drm_sync_bo_ioctl(struct drm_device *dev,
			      void *data, struct drm_file *filp)
{
	struct amdxdna_dev *xdna = to_xdna_dev(dev);
	struct amdxdna_drm_sync_bo *args = data;
	struct amdxdna_gem_obj *abo;
	struct drm_gem_object *gobj;
	int ret;

	gobj = drm_gem_object_lookup(filp, args->handle);
	if (!gobj) {
		XDNA_ERR(xdna, "Lookup GEM object failed");
		return -ENOENT;
	}
	abo = to_xdna_obj(gobj);

	ret = amdxdna_gem_pin(abo);
	if (ret) {
		XDNA_ERR(xdna, "Pin BO %d failed, ret %d", args->handle, ret);
		goto put_obj;
	}

	if (is_import_bo(abo))
		drm_clflush_sg(abo->base.sgt);
	else if (abo->mem.kva)
		drm_clflush_virt_range(abo->mem.kva + args->offset, args->size);
	else if (abo->base.pages)
		drm_clflush_pages(abo->base.pages, gobj->size >> PAGE_SHIFT);
	else
		drm_WARN(&xdna->ddev, 1, "Can not get flush memory");

	amdxdna_gem_unpin(abo);

	XDNA_DBG(xdna, "Sync bo %d offset 0x%llx, size 0x%llx\n",
		 args->handle, args->offset, args->size);

put_obj:
	drm_gem_object_put(gobj);
	return ret;
}