brcm2708: rename target to bcm27xx
[openwrt/staging/mkresin.git] / target / linux / bcm27xx / patches-4.19 / 950-0548-staging-vc-sm-cma-Add-in-allocation-for-VPU-requests.patch
1 From 275f4673d8c0601e5dbb16e743187d264e7dbed6 Mon Sep 17 00:00:00 2001
2 From: Dave Stevenson <dave.stevenson@raspberrypi.org>
3 Date: Fri, 21 Dec 2018 16:50:53 +0000
4 Subject: [PATCH] staging: vc-sm-cma: Add in allocation for VPU
5 requests.
6
7 Module has to change from tristate to bool as all CMA functions
8 are boolean.
9
10 Signed-off-by: Dave Stevenson <dave.stevenson@raspberrypi.org>
11 ---
12 .../staging/vc04_services/vc-sm-cma/Kconfig | 4 +-
13 .../staging/vc04_services/vc-sm-cma/Makefile | 2 +-
14 .../staging/vc04_services/vc-sm-cma/vc_sm.c | 642 +++++++++++++++---
15 .../staging/vc04_services/vc-sm-cma/vc_sm.h | 30 +-
16 .../vc04_services/vc-sm-cma/vc_sm_cma.c | 99 +++
17 .../vc04_services/vc-sm-cma/vc_sm_cma.h | 39 ++
18 .../vc04_services/vc-sm-cma/vc_sm_cma_vchi.c | 10 +
19 .../vc04_services/vc-sm-cma/vc_sm_cma_vchi.h | 4 +
20 .../vc04_services/vc-sm-cma/vc_sm_defs.h | 2 +
21 9 files changed, 723 insertions(+), 109 deletions(-)
22 create mode 100644 drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma.c
23 create mode 100644 drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma.h
24
25 --- a/drivers/staging/vc04_services/vc-sm-cma/Kconfig
26 +++ b/drivers/staging/vc04_services/vc-sm-cma/Kconfig
27 @@ -1,6 +1,6 @@
28 config BCM_VC_SM_CMA
29 - tristate "VideoCore Shared Memory (CMA) driver"
30 - depends on BCM2835_VCHIQ
31 + bool "VideoCore Shared Memory (CMA) driver"
32 + depends on BCM2835_VCHIQ && DMA_CMA
33 select RBTREE
34 select DMA_SHARED_BUFFER
35 help
36 --- a/drivers/staging/vc04_services/vc-sm-cma/Makefile
37 +++ b/drivers/staging/vc04_services/vc-sm-cma/Makefile
38 @@ -3,6 +3,6 @@ ccflags-y += -Idrivers/staging/vc04_serv
39 ccflags-y += -D__VCCOREVER__=0
40
41 vc-sm-cma-$(CONFIG_BCM_VC_SM_CMA) := \
42 - vc_sm.o vc_sm_cma_vchi.o
43 + vc_sm.o vc_sm_cma_vchi.o vc_sm_cma.o
44
45 obj-$(CONFIG_BCM_VC_SM_CMA) += vc-sm-cma.o
46 --- a/drivers/staging/vc04_services/vc-sm-cma/vc_sm.c
47 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm.c
48 @@ -9,10 +9,21 @@
49 * and taking some code for CMA/dmabuf handling from the Android Ion
50 * driver (Google/Linaro).
51 *
52 - * This is cut down version to only support import of dma_bufs from
53 - * other kernel drivers. A more complete implementation of the old
54 - * vmcs_sm functionality can follow later.
55 *
56 + * This driver has 3 main uses:
57 + * 1) Allocating buffers for the kernel or userspace that can be shared with the
58 + * VPU.
59 + * 2) Importing dmabufs from elsewhere for sharing with the VPU.
60 + * 3) Allocating buffers for use by the VPU.
61 + *
62 + * In the first and second cases the native handle is a dmabuf. Releasing the
63 + * resource inherently comes from releasing the dmabuf, and this will trigger
64 + * unmapping on the VPU. The underlying allocation and our buffer structure are
65 + * retained until the VPU has confirmed that it has finished with it.
66 + *
67 + * For the VPU allocations the VPU is responsible for triggering the release,
68 + * and therefore the released message decrements the dma_buf refcount (with the
69 + * VPU mapping having already been marked as released).
70 */
71
72 /* ---- Include Files ----------------------------------------------------- */
73 @@ -39,6 +50,7 @@
74 #include "vc_sm_cma_vchi.h"
75
76 #include "vc_sm.h"
77 +#include "vc_sm_cma.h"
78 #include "vc_sm_knl.h"
79
80 /* ---- Private Constants and Types --------------------------------------- */
81 @@ -72,6 +84,7 @@ struct sm_state_t {
82 struct platform_device *pdev;
83
84 struct sm_instance *sm_handle; /* Handle for videocore service. */
85 + struct cma *cma_heap;
86
87 spinlock_t kernelid_map_lock; /* Spinlock protecting kernelid_map */
88 struct idr kernelid_map;
89 @@ -80,6 +93,7 @@ struct sm_state_t {
90 struct list_head buffer_list; /* List of buffer. */
91
92 struct vc_sm_privdata_t *data_knl; /* Kernel internal data tracking. */
93 + struct vc_sm_privdata_t *vpu_allocs; /* All allocations from the VPU */
94 struct dentry *dir_root; /* Debug fs entries root. */
95 struct sm_pde_t dir_state; /* Debug fs entries state sub-tree. */
96
97 @@ -89,6 +103,12 @@ struct sm_state_t {
98 u32 int_trans_id; /* Interrupted transaction. */
99 };
100
101 +struct vc_sm_dma_buf_attachment {
102 + struct device *dev;
103 + struct sg_table *table;
104 + struct list_head list;
105 +};
106 +
107 /* ---- Private Variables ----------------------------------------------- */
108
109 static struct sm_state_t *sm_state;
110 @@ -172,12 +192,14 @@ static int vc_sm_cma_global_state_show(s
111 resource->size);
112 seq_printf(s, " DMABUF %p\n",
113 resource->dma_buf);
114 - seq_printf(s, " ATTACH %p\n",
115 - resource->attach);
116 + if (resource->imported) {
117 + seq_printf(s, " ATTACH %p\n",
118 + resource->import.attach);
119 + seq_printf(s, " SGT %p\n",
120 + resource->import.sgt);
121 + }
122 seq_printf(s, " SG_TABLE %p\n",
123 resource->sg_table);
124 - seq_printf(s, " SGT %p\n",
125 - resource->sgt);
126 seq_printf(s, " DMA_ADDR %pad\n",
127 &resource->dma_addr);
128 seq_printf(s, " VC_HANDLE %08x\n",
129 @@ -209,17 +231,33 @@ static void vc_sm_add_resource(struct vc
130 }
131
132 /*
133 - * Release an allocation.
134 - * All refcounting is done via the dma buf object.
135 + * Cleans up imported dmabuf.
136 */
137 -static void vc_sm_release_resource(struct vc_sm_buffer *buffer, int force)
138 +static void vc_sm_clean_up_dmabuf(struct vc_sm_buffer *buffer)
139 {
140 - mutex_lock(&sm_state->map_lock);
141 - mutex_lock(&buffer->lock);
142 + if (!buffer->imported)
143 + return;
144
145 - pr_debug("[%s]: buffer %p (name %s, size %zu)\n",
146 - __func__, buffer, buffer->name, buffer->size);
147 + /* Handle cleaning up imported dmabufs */
148 + mutex_lock(&buffer->lock);
149 + if (buffer->import.sgt) {
150 + dma_buf_unmap_attachment(buffer->import.attach,
151 + buffer->import.sgt,
152 + DMA_BIDIRECTIONAL);
153 + buffer->import.sgt = NULL;
154 + }
155 + if (buffer->import.attach) {
156 + dma_buf_detach(buffer->dma_buf, buffer->import.attach);
157 + buffer->import.attach = NULL;
158 + }
159 + mutex_unlock(&buffer->lock);
160 +}
161
162 +/*
163 + * Instructs VPU to decrement the refcount on a buffer.
164 + */
165 +static void vc_sm_vpu_free(struct vc_sm_buffer *buffer)
166 +{
167 if (buffer->vc_handle && buffer->vpu_state == VPU_MAPPED) {
168 struct vc_sm_free_t free = { buffer->vc_handle, 0 };
169 int status = vc_sm_cma_vchi_free(sm_state->sm_handle, &free,
170 @@ -230,17 +268,32 @@ static void vc_sm_release_resource(struc
171 }
172
173 if (sm_state->require_released_callback) {
174 - /* Need to wait for the VPU to confirm the free */
175 + /* Need to wait for the VPU to confirm the free. */
176
177 /* Retain a reference on this until the VPU has
178 * released it
179 */
180 buffer->vpu_state = VPU_UNMAPPING;
181 - goto defer;
182 + } else {
183 + buffer->vpu_state = VPU_NOT_MAPPED;
184 + buffer->vc_handle = 0;
185 }
186 - buffer->vpu_state = VPU_NOT_MAPPED;
187 - buffer->vc_handle = 0;
188 }
189 +}
190 +
191 +/*
192 + * Release an allocation.
193 + * All refcounting is done via the dma buf object.
194 + *
195 + * Must be called with buffer->lock held. The function will either release
196 + * that mutex (if deferring the release) or destroy it. The caller must
197 + * therefore not reuse the buffer on return.
198 + */
199 +static void vc_sm_release_resource(struct vc_sm_buffer *buffer)
200 +{
201 + pr_debug("[%s]: buffer %p (name %s, size %zu)\n",
202 + __func__, buffer, buffer->name, buffer->size);
203 +
204 if (buffer->vc_handle) {
205 /* We've sent the unmap request but not had the response. */
206 pr_err("[%s]: Waiting for VPU unmap response on %p\n",
207 @@ -248,45 +301,43 @@ static void vc_sm_release_resource(struc
208 goto defer;
209 }
210 if (buffer->in_use) {
211 - /* Don't release dmabuf here - we await the release */
212 + /* dmabuf still in use - we await the release */
213 pr_err("[%s]: buffer %p is still in use\n",
214 __func__, buffer);
215 goto defer;
216 }
217
218 - /* Handle cleaning up imported dmabufs */
219 - if (buffer->sgt) {
220 - dma_buf_unmap_attachment(buffer->attach, buffer->sgt,
221 - DMA_BIDIRECTIONAL);
222 - buffer->sgt = NULL;
223 - }
224 - if (buffer->attach) {
225 - dma_buf_detach(buffer->dma_buf, buffer->attach);
226 - buffer->attach = NULL;
227 - }
228 -
229 - /* Release the dma_buf (whether ours or imported) */
230 - if (buffer->import_dma_buf) {
231 - dma_buf_put(buffer->import_dma_buf);
232 - buffer->import_dma_buf = NULL;
233 - buffer->dma_buf = NULL;
234 - } else if (buffer->dma_buf) {
235 - dma_buf_put(buffer->dma_buf);
236 - buffer->dma_buf = NULL;
237 + /* Release the allocation (whether imported dmabuf or CMA allocation) */
238 + if (buffer->imported) {
239 + pr_debug("%s: Release imported dmabuf %p\n", __func__,
240 + buffer->import.dma_buf);
241 + if (buffer->import.dma_buf)
242 + dma_buf_put(buffer->import.dma_buf);
243 + else
244 + pr_err("%s: Imported dmabuf already been put for buf %p\n",
245 + __func__, buffer);
246 + buffer->import.dma_buf = NULL;
247 + } else {
248 + if (buffer->sg_table) {
249 + /* Our own allocation that we need to dma_unmap_sg */
250 + dma_unmap_sg(&sm_state->pdev->dev,
251 + buffer->sg_table->sgl,
252 + buffer->sg_table->nents,
253 + DMA_BIDIRECTIONAL);
254 + }
255 + pr_debug("%s: Release our allocation\n", __func__);
256 + vc_sm_cma_buffer_free(&buffer->alloc);
257 + pr_debug("%s: Release our allocation - done\n", __func__);
258 }
259
260 - if (buffer->sg_table && !buffer->import_dma_buf) {
261 - /* Our own allocation that we need to dma_unmap_sg */
262 - dma_unmap_sg(&sm_state->pdev->dev, buffer->sg_table->sgl,
263 - buffer->sg_table->nents, DMA_BIDIRECTIONAL);
264 - }
265
266 - /* Free the local resource. Start by removing it from the list */
267 - buffer->private = NULL;
268 + /* Free our buffer. Start by removing it from the list */
269 + mutex_lock(&sm_state->map_lock);
270 list_del(&buffer->global_buffer_list);
271 + mutex_unlock(&sm_state->map_lock);
272
273 + pr_debug("%s: Release our allocation - done\n", __func__);
274 mutex_unlock(&buffer->lock);
275 - mutex_unlock(&sm_state->map_lock);
276
277 mutex_destroy(&buffer->lock);
278
279 @@ -295,7 +346,7 @@ static void vc_sm_release_resource(struc
280
281 defer:
282 mutex_unlock(&buffer->lock);
283 - mutex_unlock(&sm_state->map_lock);
284 + return;
285 }
286
287 /* Create support for private data tracking. */
288 @@ -317,16 +368,267 @@ static struct vc_sm_privdata_t *vc_sm_cm
289 return file_data;
290 }
291
292 +static struct sg_table *dup_sg_table(struct sg_table *table)
293 +{
294 + struct sg_table *new_table;
295 + int ret, i;
296 + struct scatterlist *sg, *new_sg;
297 +
298 + new_table = kzalloc(sizeof(*new_table), GFP_KERNEL);
299 + if (!new_table)
300 + return ERR_PTR(-ENOMEM);
301 +
302 + ret = sg_alloc_table(new_table, table->nents, GFP_KERNEL);
303 + if (ret) {
304 + kfree(new_table);
305 + return ERR_PTR(-ENOMEM);
306 + }
307 +
308 + new_sg = new_table->sgl;
309 + for_each_sg(table->sgl, sg, table->nents, i) {
310 + memcpy(new_sg, sg, sizeof(*sg));
311 + sg->dma_address = 0;
312 + new_sg = sg_next(new_sg);
313 + }
314 +
315 + return new_table;
316 +}
317 +
318 +static void free_duped_table(struct sg_table *table)
319 +{
320 + sg_free_table(table);
321 + kfree(table);
322 +}
323 +
324 +/* Dma buf operations for use with our own allocations */
325 +
326 +static int vc_sm_dma_buf_attach(struct dma_buf *dmabuf,
327 + struct dma_buf_attachment *attachment)
328 +
329 +{
330 + struct vc_sm_dma_buf_attachment *a;
331 + struct sg_table *table;
332 + struct vc_sm_buffer *buf = dmabuf->priv;
333 +
334 + a = kzalloc(sizeof(*a), GFP_KERNEL);
335 + if (!a)
336 + return -ENOMEM;
337 +
338 + table = dup_sg_table(buf->sg_table);
339 + if (IS_ERR(table)) {
340 + kfree(a);
341 + return -ENOMEM;
342 + }
343 +
344 + a->table = table;
345 + INIT_LIST_HEAD(&a->list);
346 +
347 + attachment->priv = a;
348 +
349 + mutex_lock(&buf->lock);
350 + list_add(&a->list, &buf->attachments);
351 + mutex_unlock(&buf->lock);
352 + pr_debug("%s dmabuf %p attachment %p\n", __func__, dmabuf, attachment);
353 +
354 + return 0;
355 +}
356 +
357 +static void vc_sm_dma_buf_detatch(struct dma_buf *dmabuf,
358 + struct dma_buf_attachment *attachment)
359 +{
360 + struct vc_sm_dma_buf_attachment *a = attachment->priv;
361 + struct vc_sm_buffer *buf = dmabuf->priv;
362 +
363 + pr_debug("%s dmabuf %p attachment %p\n", __func__, dmabuf, attachment);
364 + free_duped_table(a->table);
365 + mutex_lock(&buf->lock);
366 + list_del(&a->list);
367 + mutex_unlock(&buf->lock);
368 +
369 + kfree(a);
370 +}
371 +
372 +static struct sg_table *vc_sm_map_dma_buf(struct dma_buf_attachment *attachment,
373 + enum dma_data_direction direction)
374 +{
375 + struct vc_sm_dma_buf_attachment *a = attachment->priv;
376 + struct sg_table *table;
377 +
378 + table = a->table;
379 +
380 + if (!dma_map_sg(attachment->dev, table->sgl, table->nents,
381 + direction))
382 + return ERR_PTR(-ENOMEM);
383 +
384 + pr_debug("%s attachment %p\n", __func__, attachment);
385 + return table;
386 +}
387 +
388 +static void vc_sm_unmap_dma_buf(struct dma_buf_attachment *attachment,
389 + struct sg_table *table,
390 + enum dma_data_direction direction)
391 +{
392 + pr_debug("%s attachment %p\n", __func__, attachment);
393 + dma_unmap_sg(attachment->dev, table->sgl, table->nents, direction);
394 +}
395 +
396 +static int vc_sm_dmabuf_mmap(struct dma_buf *dmabuf, struct vm_area_struct *vma)
397 +{
398 + struct vc_sm_buffer *buf = dmabuf->priv;
399 + struct sg_table *table = buf->sg_table;
400 + unsigned long addr = vma->vm_start;
401 + unsigned long offset = vma->vm_pgoff * PAGE_SIZE;
402 + struct scatterlist *sg;
403 + int i;
404 + int ret = 0;
405 +
406 + pr_debug("%s dmabuf %p, buf %p, vm_start %08lX\n", __func__, dmabuf,
407 + buf, addr);
408 +
409 + mutex_lock(&buf->lock);
410 +
411 + /* now map it to userspace */
412 + for_each_sg(table->sgl, sg, table->nents, i) {
413 + struct page *page = sg_page(sg);
414 + unsigned long remainder = vma->vm_end - addr;
415 + unsigned long len = sg->length;
416 +
417 + if (offset >= sg->length) {
418 + offset -= sg->length;
419 + continue;
420 + } else if (offset) {
421 + page += offset / PAGE_SIZE;
422 + len = sg->length - offset;
423 + offset = 0;
424 + }
425 + len = min(len, remainder);
426 + ret = remap_pfn_range(vma, addr, page_to_pfn(page), len,
427 + vma->vm_page_prot);
428 + if (ret)
429 + break;
430 + addr += len;
431 + if (addr >= vma->vm_end)
432 + break;
433 + }
434 + mutex_unlock(&buf->lock);
435 +
436 + if (ret)
437 + pr_err("%s: failure mapping buffer to userspace\n",
438 + __func__);
439 +
440 + return ret;
441 +}
442 +
443 +static void vc_sm_dma_buf_release(struct dma_buf *dmabuf)
444 +{
445 + struct vc_sm_buffer *buffer;
446 +
447 + if (!dmabuf)
448 + return;
449 +
450 + buffer = (struct vc_sm_buffer *)dmabuf->priv;
451 +
452 + mutex_lock(&buffer->lock);
453 +
454 + pr_debug("%s dmabuf %p, buffer %p\n", __func__, dmabuf, buffer);
455 +
456 + buffer->in_use = 0;
457 +
458 + /* Unmap on the VPU */
459 + vc_sm_vpu_free(buffer);
460 + pr_debug("%s vpu_free done\n", __func__);
461 +
462 + /* Unmap our dma_buf object (the vc_sm_buffer remains until released
463 + * on the VPU).
464 + */
465 + vc_sm_clean_up_dmabuf(buffer);
466 + pr_debug("%s clean_up dmabuf done\n", __func__);
467 +
468 + vc_sm_release_resource(buffer);
469 + pr_debug("%s done\n", __func__);
470 +}
471 +
472 +static int vc_sm_dma_buf_begin_cpu_access(struct dma_buf *dmabuf,
473 + enum dma_data_direction direction)
474 +{
475 + struct vc_sm_buffer *buf;
476 + struct vc_sm_dma_buf_attachment *a;
477 +
478 + if (!dmabuf)
479 + return -EFAULT;
480 +
481 + buf = dmabuf->priv;
482 + if (!buf)
483 + return -EFAULT;
484 +
485 + mutex_lock(&buf->lock);
486 +
487 + list_for_each_entry(a, &buf->attachments, list) {
488 + dma_sync_sg_for_cpu(a->dev, a->table->sgl, a->table->nents,
489 + direction);
490 + }
491 + mutex_unlock(&buf->lock);
492 +
493 + return 0;
494 +}
495 +
496 +static int vc_sm_dma_buf_end_cpu_access(struct dma_buf *dmabuf,
497 + enum dma_data_direction direction)
498 +{
499 + struct vc_sm_buffer *buf;
500 + struct vc_sm_dma_buf_attachment *a;
501 +
502 + if (!dmabuf)
503 + return -EFAULT;
504 + buf = dmabuf->priv;
505 + if (!buf)
506 + return -EFAULT;
507 +
508 + mutex_lock(&buf->lock);
509 +
510 + list_for_each_entry(a, &buf->attachments, list) {
511 + dma_sync_sg_for_device(a->dev, a->table->sgl, a->table->nents,
512 + direction);
513 + }
514 + mutex_unlock(&buf->lock);
515 +
516 + return 0;
517 +}
518 +
519 +static void *vc_sm_dma_buf_kmap(struct dma_buf *dmabuf, unsigned long offset)
520 +{
521 + /* FIXME: kmap of our own allocations is not implemented yet. */
522 + return NULL;
523 +}
524 +
525 +static void vc_sm_dma_buf_kunmap(struct dma_buf *dmabuf, unsigned long offset,
526 + void *ptr)
527 +{
528 + /* FIXME: nothing to undo while vc_sm_dma_buf_kmap returns NULL. */
529 +}
530 +
531 +static const struct dma_buf_ops dma_buf_ops = {
532 + .map_dma_buf = vc_sm_map_dma_buf,
533 + .unmap_dma_buf = vc_sm_unmap_dma_buf,
534 + .mmap = vc_sm_dmabuf_mmap,
535 + .release = vc_sm_dma_buf_release,
536 + .attach = vc_sm_dma_buf_attach,
537 + .detach = vc_sm_dma_buf_detatch,
538 + .begin_cpu_access = vc_sm_dma_buf_begin_cpu_access,
539 + .end_cpu_access = vc_sm_dma_buf_end_cpu_access,
540 + .map = vc_sm_dma_buf_kmap,
541 + .unmap = vc_sm_dma_buf_kunmap,
542 +};
543 /* Dma_buf operations for chaining through to an imported dma_buf */
544 static
545 int vc_sm_import_dma_buf_attach(struct dma_buf *dmabuf,
546 struct dma_buf_attachment *attachment)
547 {
548 - struct vc_sm_buffer *res = dmabuf->priv;
549 + struct vc_sm_buffer *buf = dmabuf->priv;
550
551 - if (!res->import_dma_buf)
552 + if (!buf->imported)
553 return -EINVAL;
554 - return res->import_dma_buf->ops->attach(res->import_dma_buf,
555 + return buf->import.dma_buf->ops->attach(buf->import.dma_buf,
556 attachment);
557 }
558
559 @@ -334,22 +636,23 @@ static
560 void vc_sm_import_dma_buf_detatch(struct dma_buf *dmabuf,
561 struct dma_buf_attachment *attachment)
562 {
563 - struct vc_sm_buffer *res = dmabuf->priv;
564 + struct vc_sm_buffer *buf = dmabuf->priv;
565
566 - if (!res->import_dma_buf)
567 + if (!buf->imported)
568 return;
569 - res->import_dma_buf->ops->detach(res->import_dma_buf, attachment);
570 + buf->import.dma_buf->ops->detach(buf->import.dma_buf, attachment);
571 }
572
573 static
574 struct sg_table *vc_sm_import_map_dma_buf(struct dma_buf_attachment *attachment,
575 enum dma_data_direction direction)
576 {
577 - struct vc_sm_buffer *res = attachment->dmabuf->priv;
578 + struct vc_sm_buffer *buf = attachment->dmabuf->priv;
579
580 - if (!res->import_dma_buf)
581 + if (!buf->imported)
582 return NULL;
583 - return res->import_dma_buf->ops->map_dma_buf(attachment, direction);
584 + return buf->import.dma_buf->ops->map_dma_buf(attachment,
585 + direction);
586 }
587
588 static
589 @@ -357,87 +660,88 @@ void vc_sm_import_unmap_dma_buf(struct d
590 struct sg_table *table,
591 enum dma_data_direction direction)
592 {
593 - struct vc_sm_buffer *res = attachment->dmabuf->priv;
594 + struct vc_sm_buffer *buf = attachment->dmabuf->priv;
595
596 - if (!res->import_dma_buf)
597 + if (!buf->imported)
598 return;
599 - res->import_dma_buf->ops->unmap_dma_buf(attachment, table, direction);
600 + buf->import.dma_buf->ops->unmap_dma_buf(attachment, table, direction);
601 }
602
603 static
604 int vc_sm_import_dmabuf_mmap(struct dma_buf *dmabuf, struct vm_area_struct *vma)
605 {
606 - struct vc_sm_buffer *res = dmabuf->priv;
607 + struct vc_sm_buffer *buf = dmabuf->priv;
608
609 - pr_debug("%s: mmap dma_buf %p, res %p, imported db %p\n", __func__,
610 - dmabuf, res, res->import_dma_buf);
611 - if (!res->import_dma_buf) {
612 + pr_debug("%s: mmap dma_buf %p, buf %p, imported db %p\n", __func__,
613 + dmabuf, buf, buf->import.dma_buf);
614 + if (!buf->imported) {
615 pr_err("%s: mmap dma_buf %p- not an imported buffer\n",
616 __func__, dmabuf);
617 return -EINVAL;
618 }
619 - return res->import_dma_buf->ops->mmap(res->import_dma_buf, vma);
620 + return buf->import.dma_buf->ops->mmap(buf->import.dma_buf, vma);
621 }
622
623 static
624 void vc_sm_import_dma_buf_release(struct dma_buf *dmabuf)
625 {
626 - struct vc_sm_buffer *res = dmabuf->priv;
627 + struct vc_sm_buffer *buf = dmabuf->priv;
628
629 pr_debug("%s: Relasing dma_buf %p\n", __func__, dmabuf);
630 - if (!res->import_dma_buf)
631 + mutex_lock(&buf->lock);
632 + if (!buf->imported)
633 return;
634
635 - res->in_use = 0;
636 + buf->in_use = 0;
637
638 - vc_sm_release_resource(res, 0);
639 + vc_sm_vpu_free(buf);
640 +
641 + vc_sm_release_resource(buf);
642 }
643
644 static
645 void *vc_sm_import_dma_buf_kmap(struct dma_buf *dmabuf,
646 unsigned long offset)
647 {
648 - struct vc_sm_buffer *res = dmabuf->priv;
649 + struct vc_sm_buffer *buf = dmabuf->priv;
650
651 - if (!res->import_dma_buf)
652 + if (!buf->imported)
653 return NULL;
654 - return res->import_dma_buf->ops->map(res->import_dma_buf,
655 - offset);
656 + return buf->import.dma_buf->ops->map(buf->import.dma_buf, offset);
657 }
658
659 static
660 void vc_sm_import_dma_buf_kunmap(struct dma_buf *dmabuf,
661 unsigned long offset, void *ptr)
662 {
663 - struct vc_sm_buffer *res = dmabuf->priv;
664 + struct vc_sm_buffer *buf = dmabuf->priv;
665
666 - if (!res->import_dma_buf)
667 + if (!buf->imported)
668 return;
669 - res->import_dma_buf->ops->unmap(res->import_dma_buf,
670 - offset, ptr);
671 + buf->import.dma_buf->ops->unmap(buf->import.dma_buf, offset, ptr);
672 }
673
674 static
675 int vc_sm_import_dma_buf_begin_cpu_access(struct dma_buf *dmabuf,
676 enum dma_data_direction direction)
677 {
678 - struct vc_sm_buffer *res = dmabuf->priv;
679 + struct vc_sm_buffer *buf = dmabuf->priv;
680
681 - if (!res->import_dma_buf)
682 + if (!buf->imported)
683 return -EINVAL;
684 - return res->import_dma_buf->ops->begin_cpu_access(res->import_dma_buf,
685 - direction);
686 + return buf->import.dma_buf->ops->begin_cpu_access(buf->import.dma_buf,
687 + direction);
688 }
689
690 static
691 int vc_sm_import_dma_buf_end_cpu_access(struct dma_buf *dmabuf,
692 enum dma_data_direction direction)
693 {
694 - struct vc_sm_buffer *res = dmabuf->priv;
695 + struct vc_sm_buffer *buf = dmabuf->priv;
696
697 - if (!res->import_dma_buf)
698 + if (!buf->imported)
699 return -EINVAL;
700 - return res->import_dma_buf->ops->end_cpu_access(res->import_dma_buf,
701 + return buf->import.dma_buf->ops->end_cpu_access(buf->import.dma_buf,
702 direction);
703 }
704
705 @@ -516,9 +820,8 @@ vc_sm_cma_import_dmabuf_internal(struct
706 memcpy(import.name, VC_SM_RESOURCE_NAME_DEFAULT,
707 sizeof(VC_SM_RESOURCE_NAME_DEFAULT));
708
709 - pr_debug("[%s]: attempt to import \"%s\" data - type %u, addr %pad, size %u\n",
710 - __func__, import.name, import.type, &dma_addr,
711 - import.size);
712 + pr_debug("[%s]: attempt to import \"%s\" data - type %u, addr %pad, size %u.\n",
713 + __func__, import.name, import.type, &dma_addr, import.size);
714
715 /* Allocate the videocore buffer. */
716 status = vc_sm_cma_vchi_import(sm_state->sm_handle, &import, &result,
717 @@ -548,12 +851,14 @@ vc_sm_cma_import_dmabuf_internal(struct
718 buffer->size = import.size;
719 buffer->vpu_state = VPU_MAPPED;
720
721 - buffer->import_dma_buf = dma_buf;
722 + buffer->imported = 1;
723 + buffer->import.dma_buf = dma_buf;
724
725 - buffer->attach = attach;
726 - buffer->sgt = sgt;
727 + buffer->import.attach = attach;
728 + buffer->import.sgt = sgt;
729 buffer->dma_addr = dma_addr;
730 buffer->in_use = 1;
731 + buffer->kernel_id = import.kernel_id;
732
733 /*
734 * We're done - we need to export a new dmabuf chaining through most
735 @@ -594,6 +899,91 @@ error:
736 return ret;
737 }
738
739 +static int vc_sm_cma_vpu_alloc(u32 size, uint32_t align, const char *name,
740 + u32 mem_handle, struct vc_sm_buffer **ret_buffer)
741 +{
742 + DEFINE_DMA_BUF_EXPORT_INFO(exp_info);
743 + struct vc_sm_buffer *buffer = NULL;
744 + int aligned_size;
745 + int ret = 0;
746 +
747 + /* Align to the user requested align */
748 + aligned_size = ALIGN(size, align);
749 + /* and then to a page boundary */
750 + aligned_size = PAGE_ALIGN(aligned_size);
751 +
752 + if (!aligned_size)
753 + return -EINVAL;
754 +
755 + /* Allocate local buffer to track this allocation. */
756 + buffer = kzalloc(sizeof(*buffer), GFP_KERNEL);
757 + if (!buffer)
758 + return -ENOMEM;
759 +
760 + mutex_init(&buffer->lock);
761 +
762 + if (vc_sm_cma_buffer_allocate(sm_state->cma_heap, &buffer->alloc,
763 + aligned_size)) {
764 + pr_err("[%s]: cma alloc of %d bytes failed\n",
765 + __func__, aligned_size);
766 + ret = -ENOMEM;
767 + goto error;
768 + }
769 + buffer->sg_table = buffer->alloc.sg_table;
770 +
771 + pr_debug("[%s]: cma alloc of %d bytes success\n",
772 + __func__, aligned_size);
773 +
774 + if (dma_map_sg(&sm_state->pdev->dev, buffer->sg_table->sgl,
775 + buffer->sg_table->nents, DMA_BIDIRECTIONAL) <= 0) {
776 + pr_err("[%s]: dma_map_sg failed\n", __func__);
777 + goto error;
778 + }
779 +
780 + INIT_LIST_HEAD(&buffer->attachments);
781 +
782 + memcpy(buffer->name, name,
783 + min(sizeof(buffer->name), strlen(name)));
784 +
785 + exp_info.ops = &dma_buf_ops;
786 + exp_info.size = aligned_size;
787 + exp_info.flags = O_RDWR;
788 + exp_info.priv = buffer;
789 +
790 + buffer->dma_buf = dma_buf_export(&exp_info);
791 + if (IS_ERR(buffer->dma_buf)) {
792 + ret = PTR_ERR(buffer->dma_buf);
793 + goto error;
794 + }
795 + buffer->dma_addr = (uint32_t)sg_dma_address(buffer->sg_table->sgl);
796 + if ((buffer->dma_addr & 0xC0000000) != 0xC0000000) {
797 + pr_err("%s: Expecting an uncached alias for dma_addr %pad\n",
798 + __func__, &buffer->dma_addr);
799 + buffer->dma_addr |= 0xC0000000;
800 + }
801 + buffer->private = sm_state->vpu_allocs;
802 +
803 + buffer->vc_handle = mem_handle;
804 + buffer->vpu_state = VPU_MAPPED;
805 + buffer->vpu_allocated = 1;
806 + buffer->size = size;
807 + /*
808 + * Create an ID that will be passed along with our message so
809 + * that when we service the release reply, we can look up which
810 + * resource is being released.
811 + */
812 + buffer->kernel_id = get_kernel_id(buffer);
813 +
814 + vc_sm_add_resource(sm_state->vpu_allocs, buffer);
815 +
816 + *ret_buffer = buffer;
817 + return 0;
818 +error:
819 + if (buffer)
820 + vc_sm_release_resource(buffer);
821 + return ret;
822 +}
823 +
824 static void
825 vc_sm_vpu_event(struct sm_instance *instance, struct vc_sm_result_t *reply,
826 int reply_len)
827 @@ -612,21 +1002,61 @@ vc_sm_vpu_event(struct sm_instance *inst
828 struct vc_sm_released *release = (struct vc_sm_released *)reply;
829 struct vc_sm_buffer *buffer =
830 lookup_kernel_id(release->kernel_id);
831 + if (!buffer) {
832 + pr_err("%s: VC released a buffer that is already released, kernel_id %d\n",
833 + __func__, release->kernel_id);
834 + break;
835 + }
836 + mutex_lock(&buffer->lock);
837
838 - /*
839 - * FIXME: Need to check buffer is still valid and allocated
840 - * before continuing
841 - */
842 pr_debug("%s: Released addr %08x, size %u, id %08x, mem_handle %08x\n",
843 __func__, release->addr, release->size,
844 release->kernel_id, release->vc_handle);
845 - mutex_lock(&buffer->lock);
846 +
847 buffer->vc_handle = 0;
848 buffer->vpu_state = VPU_NOT_MAPPED;
849 - mutex_unlock(&buffer->lock);
850 free_kernel_id(release->kernel_id);
851
852 - vc_sm_release_resource(buffer, 0);
853 + if (buffer->vpu_allocated) {
854 + /* VPU allocation, so release the dmabuf which will
855 + * trigger the clean up.
856 + */
857 + mutex_unlock(&buffer->lock);
858 + dma_buf_put(buffer->dma_buf);
859 + } else {
860 + vc_sm_release_resource(buffer);
861 + }
862 + }
863 + break;
864 + case VC_SM_MSG_TYPE_VC_MEM_REQUEST:
865 + {
866 + struct vc_sm_buffer *buffer = NULL;
867 + struct vc_sm_vc_mem_request *req =
868 + (struct vc_sm_vc_mem_request *)reply;
869 + struct vc_sm_vc_mem_request_result reply;
870 + int ret;
871 +
872 + pr_debug("%s: Request %u bytes of memory, align %d name %s, trans_id %08x\n",
873 + __func__, req->size, req->align, req->name,
874 + req->trans_id);
875 + ret = vc_sm_cma_vpu_alloc(req->size, req->align, req->name,
876 + req->vc_handle, &buffer);
877 +
878 + reply.trans_id = req->trans_id;
879 + if (!ret) {
880 + reply.addr = buffer->dma_addr;
881 + reply.kernel_id = buffer->kernel_id;
882 + pr_debug("%s: Allocated resource buffer %p, addr %pad\n",
883 + __func__, buffer, &buffer->dma_addr);
884 + } else {
885 + pr_err("%s: Allocation failed size %u, name %s, vc_handle %u\n",
886 + __func__, req->size, req->name, req->vc_handle);
887 + reply.addr = 0;
888 + reply.kernel_id = 0;
889 + }
890 + vc_sm_vchi_client_vc_mem_req_reply(sm_state->sm_handle, &reply,
891 + &sm_state->int_trans_id);
892 + break;
893 }
894 break;
895 default:
896 @@ -645,6 +1075,14 @@ static void vc_sm_connected_init(void)
897
898 pr_info("[%s]: start\n", __func__);
899
900 + if (vc_sm_cma_add_heaps(&sm_state->cma_heap) ||
901 + !sm_state->cma_heap) {
902 + pr_err("[%s]: failed to initialise CMA heaps\n",
903 + __func__);
904 + ret = -EIO;
905 + goto err_free_mem;
906 + }
907 +
908 /*
909 * Initialize and create a VCHI connection for the shared memory service
910 * running on videocore.
911 @@ -696,7 +1134,7 @@ static void vc_sm_connected_init(void)
912 goto err_remove_shared_memory;
913 }
914
915 - version.version = 1;
916 + version.version = 2;
917 ret = vc_sm_cma_vchi_client_version(sm_state->sm_handle, &version,
918 &version_result,
919 &sm_state->int_trans_id);
920 @@ -768,7 +1206,7 @@ static int bcm2835_vc_sm_cma_remove(stru
921 int vc_sm_cma_int_handle(void *handle)
922 {
923 struct dma_buf *dma_buf = (struct dma_buf *)handle;
924 - struct vc_sm_buffer *res;
925 + struct vc_sm_buffer *buf;
926
927 /* Validate we can work with this device. */
928 if (!sm_state || !handle) {
929 @@ -776,8 +1214,8 @@ int vc_sm_cma_int_handle(void *handle)
930 return 0;
931 }
932
933 - res = (struct vc_sm_buffer *)dma_buf->priv;
934 - return res->vc_handle;
935 + buf = (struct vc_sm_buffer *)dma_buf->priv;
936 + return buf->vc_handle;
937 }
938 EXPORT_SYMBOL_GPL(vc_sm_cma_int_handle);
939
940 @@ -804,7 +1242,7 @@ EXPORT_SYMBOL_GPL(vc_sm_cma_free);
941 int vc_sm_cma_import_dmabuf(struct dma_buf *src_dmabuf, void **handle)
942 {
943 struct dma_buf *new_dma_buf;
944 - struct vc_sm_buffer *res;
945 + struct vc_sm_buffer *buf;
946 int ret;
947
948 /* Validate we can work with this device. */
949 @@ -818,7 +1256,7 @@ int vc_sm_cma_import_dmabuf(struct dma_b
950
951 if (!ret) {
952 pr_debug("%s: imported to ptr %p\n", __func__, new_dma_buf);
953 - res = (struct vc_sm_buffer *)new_dma_buf->priv;
954 + buf = (struct vc_sm_buffer *)new_dma_buf->priv;
955
956 /* Assign valid handle at this time.*/
957 *handle = new_dma_buf;
958 --- a/drivers/staging/vc04_services/vc-sm-cma/vc_sm.h
959 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm.h
960 @@ -21,6 +21,8 @@
961 #include <linux/types.h>
962 #include <linux/miscdevice.h>
963
964 +#include "vc_sm_cma.h"
965 +
966 #define VC_SM_MAX_NAME_LEN 32
967
968 enum vc_sm_vpu_mapping_state {
969 @@ -29,31 +31,51 @@ enum vc_sm_vpu_mapping_state {
970 VPU_UNMAPPING
971 };
972
973 +struct vc_sm_imported {
974 + struct dma_buf *dma_buf;
975 + struct dma_buf_attachment *attach;
976 + struct sg_table *sgt;
977 +};
978 +
979 struct vc_sm_buffer {
980 struct list_head global_buffer_list; /* Global list of buffers. */
981
982 + /* Index in the kernel_id idr so that we can find the
983 + * vc_sm_buffer again when servicing the VCHI reply.
984 + */
985 + int kernel_id;
986 +
987 size_t size;
988
989 /* Lock over all the following state for this buffer */
990 struct mutex lock;
991 - struct sg_table *sg_table;
992 struct list_head attachments;
993
994 char name[VC_SM_MAX_NAME_LEN];
995
996 int in_use:1; /* Kernel is still using this resource */
997 + int imported:1; /* Imported dmabuf */
998 +
999 + struct sg_table *sg_table;
1000
1001 enum vc_sm_vpu_mapping_state vpu_state;
1002 u32 vc_handle; /* VideoCore handle for this buffer */
1003 + int vpu_allocated; /*
1004 + * The VPU made this allocation. Release the
1005 + * local dma_buf when the VPU releases the
1006 + * resource.
1007 + */
1008
1009 /* DMABUF related fields */
1010 - struct dma_buf *import_dma_buf;
1011 struct dma_buf *dma_buf;
1012 - struct dma_buf_attachment *attach;
1013 - struct sg_table *sgt;
1014 dma_addr_t dma_addr;
1015
1016 struct vc_sm_privdata_t *private;
1017 +
1018 + union {
1019 + struct vc_sm_cma_alloc_data alloc;
1020 + struct vc_sm_imported import;
1021 + };
1022 };
1023
1024 #endif
1025 --- /dev/null
1026 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma.c
1027 @@ -0,0 +1,99 @@
1028 +// SPDX-License-Identifier: GPL-2.0
1029 +/*
1030 + * VideoCore Shared Memory CMA allocator
1031 + *
1032 + * Copyright: 2018, Raspberry Pi (Trading) Ltd
1033 + *
1034 + * Based on the Android ION allocator
1035 + * Copyright (C) Linaro 2012
1036 + * Author: <benjamin.gaignard@linaro.org> for ST-Ericsson.
1037 + *
1038 + */
1039 +
1040 +#include <linux/slab.h>
1041 +#include <linux/errno.h>
1042 +#include <linux/err.h>
1043 +#include <linux/cma.h>
1044 +#include <linux/scatterlist.h>
1045 +
1046 +#include "vc_sm_cma.h"
1047 +
1048 +/* CMA heap operations functions */
1049 +int vc_sm_cma_buffer_allocate(struct cma *cma_heap,
1050 + struct vc_sm_cma_alloc_data *buffer,
1051 + unsigned long len)
1052 +{
1053 + /* len should already be page aligned; returns 0 or a negative errno */
1054 + unsigned long num_pages = len / PAGE_SIZE;
1055 + struct sg_table *table;
1056 + struct page *pages;
1057 + int ret = -ENOMEM;
1058 +
1059 + /* On 4.19 cma_alloc()'s last argument is "bool no_warn", not a gfp mask */
1060 + pages = cma_alloc(cma_heap, num_pages, 0, false);
1061 + if (!pages)
1062 + return ret;
1063 +
1064 + table = kmalloc(sizeof(*table), GFP_KERNEL);
1065 + if (!table)
1066 + goto err;
1067 +
1068 + ret = sg_alloc_table(table, 1, GFP_KERNEL);
1069 + if (ret)
1070 + goto free_mem;
1071 +
1072 + sg_set_page(table->sgl, pages, len, 0);
1073 + buffer->priv_virt = pages;
1074 + buffer->sg_table = table;
1075 + buffer->cma_heap = cma_heap;
1076 + buffer->num_pages = num_pages;
1077 + return 0;
1078 +
1079 +free_mem:
1080 + kfree(table);
1081 +err:
1082 + cma_release(cma_heap, pages, num_pages);
1083 + return ret;
1084 +}
1085 +
1086 +void vc_sm_cma_buffer_free(struct vc_sm_cma_alloc_data *buffer)
1087 +{
1088 + struct sg_table *table = buffer->sg_table;
1089 +
1090 + /* Hand the pages back to the CMA area recorded at allocation time. */
1091 + if (buffer->cma_heap)
1092 + cma_release(buffer->cma_heap, buffer->priv_virt,
1093 + buffer->num_pages);
1094 +
1095 + /* Tear down the scatterlist and forget it so it is not freed twice. */
1096 + if (table) {
1097 + sg_free_table(table);
1098 + kfree(table);
1099 + buffer->sg_table = NULL;
1100 + }
1101 +}
1102 +
1103 +/* cma_for_each_area() callback: latch the first CMA area seen into *priv. */
1104 +static int __vc_sm_cma_add_heaps(struct cma *cma, void *priv)
1105 +{
1106 + struct cma **heap = priv;
1107 + const char *name = cma_get_name(cma);
1108 + phys_addr_t phys_addr = cma_get_base(cma);
1109 +
1110 + if (!(*heap)) {
1111 + pr_debug("%s: Adding cma heap %s (start %pap, size %lu) for use by vcsm\n",
1112 + __func__, name, &phys_addr, cma_get_size(cma));
1113 + *heap = cma;
1114 + } else {
1115 + pr_err("%s: Ignoring heap %s as already set\n",
1116 + __func__, name);
1117 + }
1118 +
1119 + return 0;
1120 +}
1121 +
1122 +int vc_sm_cma_add_heaps(struct cma **cma_heap)
1123 +{
1124 + /* Visit every CMA area; the callback always returns 0 and fills *cma_heap. */
1125 + return cma_for_each_area(__vc_sm_cma_add_heaps, cma_heap);
1126 +}
1127 --- /dev/null
1128 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma.h
1129 @@ -0,0 +1,39 @@
1130 +/* SPDX-License-Identifier: GPL-2.0 */
1131 +
1132 +/*
1133 + * VideoCore Shared Memory CMA allocator
1134 + *
1135 + * Copyright: 2018, Raspberry Pi (Trading) Ltd
1136 + *
1137 + * Based on the Android ION allocator
1138 + * Copyright (C) Linaro 2012
1139 + * Author: <benjamin.gaignard@linaro.org> for ST-Ericsson.
1140 + *
1141 + * This software is licensed under the terms of the GNU General Public
1142 + * License version 2, as published by the Free Software Foundation, and
1143 + * may be copied, distributed, and modified under those terms.
1144 + *
1145 + * This program is distributed in the hope that it will be useful,
1146 + * but WITHOUT ANY WARRANTY; without even the implied warranty of
1147 + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
1148 + * GNU General Public License for more details.
1149 + *
1150 + */
1151 +#ifndef VC_SM_CMA_H
1152 +#define VC_SM_CMA_H
1153 +
1154 +struct vc_sm_cma_alloc_data {
1155 + struct cma *cma_heap; /* CMA area the pages were allocated from */
1156 + unsigned long num_pages; /* allocation length in pages (len / PAGE_SIZE) */
1157 + void *priv_virt; /* struct page * from cma_alloc(), not a virtual address */
1158 + struct sg_table *sg_table; /* kmalloc'd single-entry table covering the pages */
1159 +};
1160 +
1161 +int vc_sm_cma_buffer_allocate(struct cma *cma_heap,
1162 + struct vc_sm_cma_alloc_data *buffer,
1163 + unsigned long len);
1164 +void vc_sm_cma_buffer_free(struct vc_sm_cma_alloc_data *buffer);
1165 +
1166 +int vc_sm_cma_add_heaps(struct cma **cma_heap);
1167 +
1168 +#endif
1169 --- a/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma_vchi.c
1170 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma_vchi.c
1171 @@ -500,3 +500,13 @@ int vc_sm_cma_vchi_client_version(struct
1172 msg, sizeof(*msg), NULL, 0,
1173 cur_trans_id, 0);
1174 }
1175 +
1176 +int vc_sm_vchi_client_vc_mem_req_reply(struct sm_instance *handle,
1177 + struct vc_sm_vc_mem_request_result *msg,
1178 + uint32_t *cur_trans_id)
1179 +{
1180 + /* The pointer/size pair after the message is unused here: NULL, 0 */
1181 + return vc_sm_cma_vchi_send_msg(handle,
1182 + VC_SM_MSG_TYPE_VC_MEM_REQUEST_REPLY, msg,
1183 + sizeof(*msg), NULL, 0, cur_trans_id, 0);
1184 +}
1185 --- a/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma_vchi.h
1186 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm_cma_vchi.h
1187 @@ -56,4 +56,8 @@ int vc_sm_cma_vchi_client_version(struct
1188 struct vc_sm_result_t *result,
1189 u32 *cur_trans_id);
1190
1191 +int vc_sm_vchi_client_vc_mem_req_reply(struct sm_instance *handle,
1192 + struct vc_sm_vc_mem_request_result *msg,
1193 + uint32_t *cur_trans_id);
1194 +
1195 #endif /* __VC_SM_CMA_VCHI_H__INCLUDED__ */
1196 --- a/drivers/staging/vc04_services/vc-sm-cma/vc_sm_defs.h
1197 +++ b/drivers/staging/vc04_services/vc-sm-cma/vc_sm_defs.h
1198 @@ -264,6 +264,8 @@ struct vc_sm_vc_mem_request {
1199 u32 align;
1200 /* resource name (for easier tracking) */
1201 char name[VC_SM_RESOURCE_NAME];
1202 + /* VPU handle for the resource */
1203 + u32 vc_handle;
1204 };
1205
1206 /* Response from the kernel to provide the VPU with some memory */