1 // SPDX-License-Identifier: GPL-2.0
3 // Copyright (c) 2018 MediaTek Inc.
5 #include <linux/bitops.h>
7 #include <linux/clk-provider.h>
8 #include <linux/dma-mapping.h>
9 #include <linux/errno.h>
10 #include <linux/interrupt.h>
12 #include <linux/iopoll.h>
13 #include <linux/kernel.h>
14 #include <linux/module.h>
15 #include <linux/platform_device.h>
16 #include <linux/mailbox_controller.h>
17 #include <linux/mailbox/mtk-cmdq-mailbox.h>
18 #include <linux/of_device.h>
/*
 * Helper macros. CMDQ_NUM_CMD(t) divides the packet's cmd_buf_size by
 * CMDQ_INST_SIZE; CMDQ_GCE_NUM_MAX sizes the clocks[] array.
 * CMDQ_OP_CODE_SHIFT and CMDQ_INST_SIZE are not defined in this file.
 * NOTE(review): the argument t of CMDQ_NUM_CMD is not parenthesized in the
 * expansion, so only pass a plain identifier or an already-parenthesized
 * expression.
 */
20 #define CMDQ_OP_CODE_MASK (0xff << CMDQ_OP_CODE_SHIFT)
21 #define CMDQ_NUM_CMD(t) (t->cmd_buf_size / CMDQ_INST_SIZE)
22 #define CMDQ_GCE_NUM_MAX (2)
/* Register offsets that this file adds to cmdq->base. */
24 #define CMDQ_CURR_IRQ_STATUS 0x10
25 #define CMDQ_SYNC_TOKEN_UPDATE 0x68
26 #define CMDQ_THR_SLOT_CYCLES 0x30
/*
 * CMDQ_THR_BASE is added to cmdq->base when cmdq_probe() computes each
 * thread's register base. NOTE(review): CMDQ_THR_SIZE is presumably the
 * per-thread stride; its use is not visible in this excerpt.
 */
27 #define CMDQ_THR_BASE 0x100
28 #define CMDQ_THR_SIZE 0x80
/* Register offsets that this file adds to thread->base. */
29 #define CMDQ_THR_WARM_RESET 0x00
30 #define CMDQ_THR_ENABLE_TASK 0x04
31 #define CMDQ_THR_SUSPEND_TASK 0x08
32 #define CMDQ_THR_CURR_STATUS 0x0c
33 #define CMDQ_THR_IRQ_STATUS 0x10
34 #define CMDQ_THR_IRQ_ENABLE 0x14
35 #define CMDQ_THR_CURR_ADDR 0x20
36 #define CMDQ_THR_END_ADDR 0x24
37 #define CMDQ_THR_WAIT_TOKEN 0x30
38 #define CMDQ_THR_PRIORITY 0x40
/* Offset from cmdq->base; cmdq_init() writes 0x7 here when control_by_sw. */
40 #define GCE_GCTL_VALUE 0x48
/* Value cmdq_init() writes to CMDQ_THR_SLOT_CYCLES. */
42 #define CMDQ_THR_ACTIVE_SLOT_CYCLES 0x3200
/* Values for CMDQ_THR_ENABLE_TASK and CMDQ_THR_SUSPEND_TASK. */
43 #define CMDQ_THR_ENABLED 0x1
44 #define CMDQ_THR_DISABLED 0x0
45 #define CMDQ_THR_SUSPEND 0x1
46 #define CMDQ_THR_RESUME 0x0
/* Bit polled in CMDQ_THR_CURR_STATUS / bit written and polled in CMDQ_THR_WARM_RESET. */
47 #define CMDQ_THR_STATUS_SUSPENDED BIT(1)
48 #define CMDQ_THR_DO_WARM_RESET BIT(0)
/* Flags tested against CMDQ_THR_IRQ_STATUS; their OR is written to CMDQ_THR_IRQ_ENABLE. */
49 #define CMDQ_THR_IRQ_DONE 0x1
50 #define CMDQ_THR_IRQ_ERROR 0x12
51 #define CMDQ_THR_IRQ_EN (CMDQ_THR_IRQ_ERROR | CMDQ_THR_IRQ_DONE)
/* Bit tested in CMDQ_THR_WAIT_TOKEN by cmdq_thread_is_in_wfe(). */
52 #define CMDQ_THR_IS_WAITING BIT(31)
/*
 * CMDQ_JUMP_BY_PA is placed in the upper 32 bits of the 64-bit instruction
 * built in cmdq_task_insert_into_thread(). CMDQ_JUMP_BY_OFFSET is not used
 * in the visible code.
 */
54 #define CMDQ_JUMP_BY_OFFSET 0x10000000
55 #define CMDQ_JUMP_BY_PA 0x10000001
/*
 * Per-thread fields (the enclosing struct header is not visible in this
 * excerpt; the code accesses them as thread->chan and
 * thread->task_busy_list).
 * chan is assigned in cmdq_xlate(); task_busy_list is initialized in
 * cmdq_probe() and holds tasks linked through their list_entry.
 */
58 struct mbox_chan *chan;
60 struct list_head task_busy_list;
/*
 * Per-task fields (the enclosing struct header is not visible in this
 * excerpt; the code accesses them through struct cmdq_task pointers).
 * list_entry links the task into its thread's task_busy_list; thread is
 * set in cmdq_mbox_send_data().
 */
66 struct list_head list_entry;
68 struct cmdq_thread *thread;
69 struct cmdq_pkt *pkt; /* the packet sent from mailbox client */
/*
 * Controller fields (the enclosing struct header is not visible in this
 * excerpt; the code accesses them through struct cmdq pointers).
 * mbox is the embedded mailbox controller used with container_of();
 * thread points to an array of thread_nr entries allocated in cmdq_probe();
 * clocks is passed to the clk_bulk_* calls together with gce_num.
 */
73 struct mbox_controller mbox;
78 struct cmdq_thread *thread;
79 struct clk_bulk_data clocks[CMDQ_GCE_NUM_MAX];
/*
 * cmdq_get_shift_pa() - return the shift_pa value of the controller owning
 * a channel.
 * @chan: mailbox channel whose chan->mbox is embedded in a struct cmdq.
 *
 * Elsewhere in this file physical addresses are shifted right by shift_pa
 * before being written to thread registers. Exported for use outside this
 * file.
 */
93 u8 cmdq_get_shift_pa(struct mbox_chan *chan)
/* Recover the driver state from the embedded mailbox controller. */
95 struct cmdq *cmdq = container_of(chan->mbox, struct cmdq, mbox);
97 return cmdq->shift_pa;
99 EXPORT_SYMBOL(cmdq_get_shift_pa);
/*
 * Request suspension of a GCE thread and wait for the hardware to report
 * it as suspended.
 * @cmdq: controller, used for logging and for computing the thread offset.
 * @thread: thread to suspend.
 *
 * Callers in this file treat a negative return value as failure. The
 * return statements themselves are not visible in this excerpt.
 */
101 static int cmdq_thread_suspend(struct cmdq *cmdq, struct cmdq_thread *thread)
/* Write the suspend request first, then check whether it needs waiting for. */
105 writel(CMDQ_THR_SUSPEND, thread->base + CMDQ_THR_SUSPEND_TASK);
107 /* If already disabled, treat as suspended successful. */
108 if (!(readl(thread->base + CMDQ_THR_ENABLE_TASK) & CMDQ_THR_ENABLED))
/*
 * Poll CMDQ_THR_CURR_STATUS until the suspended bit is set; the trailing
 * arguments are the poll delay (0 us) and the timeout (10 us).
 */
111 if (readl_poll_timeout_atomic(thread->base + CMDQ_THR_CURR_STATUS,
112 status, status & CMDQ_THR_STATUS_SUSPENDED, 0, 10)) {
/* The logged value is the thread's register offset from the controller base. */
113 dev_err(cmdq->mbox.dev, "suspend GCE thread 0x%x failed\n",
114 (u32)(thread->base - cmdq->base));
/*
 * Undo cmdq_thread_suspend() by writing CMDQ_THR_RESUME to the thread's
 * CMDQ_THR_SUSPEND_TASK register. No completion is polled for.
 */
121 static void cmdq_thread_resume(struct cmdq_thread *thread)
123 writel(CMDQ_THR_RESUME, thread->base + CMDQ_THR_SUSPEND_TASK);
/*
 * Program controller-level registers. The bulk clocks are enabled for the
 * duration of the register writes and disabled again afterwards.
 * @cmdq: controller to initialize.
 */
126 static void cmdq_init(struct cmdq *cmdq)
/* A clock enable failure only triggers a warning; the writes still proceed. */
130 WARN_ON(clk_bulk_enable(cmdq->gce_num, cmdq->clocks));
/* Only platforms with control_by_sw set get the GCE_GCTL_VALUE write. */
131 if (cmdq->control_by_sw)
132 writel(0x7, cmdq->base + GCE_GCTL_VALUE);
133 writel(CMDQ_THR_ACTIVE_SLOT_CYCLES, cmdq->base + CMDQ_THR_SLOT_CYCLES);
/*
 * Write every event id from 0 to CMDQ_MAX_EVENT (inclusive) to
 * CMDQ_SYNC_TOKEN_UPDATE.
 * NOTE(review): presumably this clears each event token - confirm against
 * the hardware documentation.
 */
134 for (i = 0; i <= CMDQ_MAX_EVENT; i++)
135 writel(i, cmdq->base + CMDQ_SYNC_TOKEN_UPDATE);
136 clk_bulk_disable(cmdq->gce_num, cmdq->clocks);
/*
 * Warm-reset a GCE thread: set CMDQ_THR_DO_WARM_RESET and poll until the
 * hardware clears the bit again.
 * @cmdq: controller, used for logging and for computing the thread offset.
 * @thread: thread to reset.
 *
 * cmdq_mbox_send_data() treats a negative return value as failure. The
 * poll delay/timeout arguments and the return statements are on lines not
 * visible in this excerpt.
 */
139 static int cmdq_thread_reset(struct cmdq *cmdq, struct cmdq_thread *thread)
143 writel(CMDQ_THR_DO_WARM_RESET, thread->base + CMDQ_THR_WARM_RESET);
/* Completion is signalled by the reset bit reading back as zero. */
144 if (readl_poll_timeout_atomic(thread->base + CMDQ_THR_WARM_RESET,
145 warm_reset, !(warm_reset & CMDQ_THR_DO_WARM_RESET),
/* The logged value is the thread's register offset from the controller base. */
147 dev_err(cmdq->mbox.dev, "reset GCE thread 0x%x failed\n",
148 (u32)(thread->base - cmdq->base));
/*
 * Reset a GCE thread and then write CMDQ_THR_DISABLED to its enable
 * register. The result of cmdq_thread_reset() is ignored here, so the
 * disable write happens even if the reset failed.
 */
155 static void cmdq_thread_disable(struct cmdq *cmdq, struct cmdq_thread *thread)
157 cmdq_thread_reset(cmdq, thread);
158 writel(CMDQ_THR_DISABLED, thread->base + CMDQ_THR_ENABLE_TASK);
/*
 * Read the thread's CMDQ_THR_CURR_ADDR register and write the same value
 * straight back; the value itself is unchanged, only the write matters.
 */
161 /* notify GCE to re-fetch commands by setting GCE thread PC */
162 static void cmdq_thread_invalidate_fetched_data(struct cmdq_thread *thread)
164 writel(readl(thread->base + CMDQ_THR_CURR_ADDR),
165 thread->base + CMDQ_THR_CURR_ADDR);
/*
 * Chain a new task behind the last task already queued on its thread by
 * overwriting the last instruction slot of the previous task's command
 * buffer with a jump to the new task.
 * @task: task to append; task->thread and task->pa_base must be set.
 *
 * NOTE(review): list_last_entry() does not return a valid task for an
 * empty list, so this must only be called while task_busy_list is
 * non-empty - confirm at the call site.
 */
168 static void cmdq_task_insert_into_thread(struct cmdq_task *task)
170 struct device *dev = task->cmdq->mbox.dev;
171 struct cmdq_thread *thread = task->thread;
/* The most recently queued task is the one that must jump to the new task. */
172 struct cmdq_task *prev_task = list_last_entry(
173 &thread->task_busy_list, typeof(*task), list_entry);
/* The command buffer is addressed as an array of 64-bit instructions. */
174 u64 *prev_task_base = prev_task->pkt->va_base;
176 /* let previous task jump to this task */
/* Hand the buffer to the CPU before patching it. */
177 dma_sync_single_for_cpu(dev, prev_task->pa_base,
178 prev_task->pkt->cmd_buf_size, DMA_TO_DEVICE);
/*
 * Last slot = CMDQ_JUMP_BY_PA in the upper 32 bits, the new task's
 * shifted physical address in the lower bits.
 */
179 prev_task_base[CMDQ_NUM_CMD(prev_task->pkt) - 1] =
180 (u64)CMDQ_JUMP_BY_PA << 32 |
181 (task->pa_base >> task->cmdq->shift_pa);
/* Hand the patched buffer back to the device. */
182 dma_sync_single_for_device(dev, prev_task->pa_base,
183 prev_task->pkt->cmd_buf_size, DMA_TO_DEVICE);
/* Rewrite the thread PC so that the patched instruction is fetched again. */
185 cmdq_thread_invalidate_fetched_data(thread);
/*
 * Return true when CMDQ_THR_IS_WAITING (bit 31) is set in the thread's
 * CMDQ_THR_WAIT_TOKEN register.
 * NOTE(review): "wfe" presumably stands for "wait for event" - confirm.
 */
188 static bool cmdq_thread_is_in_wfe(struct cmdq_thread *thread)
190 return readl(thread->base + CMDQ_THR_WAIT_TOKEN) & CMDQ_THR_IS_WAITING;
/*
 * Report completion of a task to the mailbox client and unlink it from its
 * thread's busy list.
 * @task: finished (or aborted) task.
 * @sta: completion status supplied by the caller (0, -ENOEXEC or
 *       -ECONNABORTED in this file).
 *
 * NOTE(review): the store of @sta into the callback data and any release
 * of @task are on lines not visible in this excerpt.
 */
193 static void cmdq_task_exec_done(struct cmdq_task *task, int sta)
195 struct cmdq_task_cb *cb = &task->pkt->async_cb;
196 struct cmdq_cb_data data;
/* A packet without a callback is unexpected but only warned about. */
198 WARN_ON(cb->cb == (cmdq_async_flush_cb)NULL);
200 data.data = cb->data;
201 data.pkt = task->pkt;
/* Deliver the completion record through the mailbox framework. */
205 mbox_chan_received_data(task->thread->chan, &data);
207 list_del(&task->list_entry);
/*
 * Recover a thread after a task error: suspend the thread, point its
 * program counter at the first task on the busy list, and resume it.
 * @task: the task that failed; only its thread and cmdq are used here.
 */
210 static void cmdq_task_handle_error(struct cmdq_task *task)
212 struct cmdq_thread *thread = task->thread;
213 struct cmdq_task *next_task;
214 struct cmdq *cmdq = task->cmdq;
216 dev_err(cmdq->mbox.dev, "task 0x%p error\n", task);
217 WARN_ON(cmdq_thread_suspend(cmdq, thread) < 0);
/* May be NULL when the busy list is empty. */
218 next_task = list_first_entry_or_null(&thread->task_busy_list,
219 struct cmdq_task, list_entry);
/*
 * NOTE(review): the write below dereferences next_task; a NULL guard is
 * not visible in this excerpt - confirm one exists on the omitted line.
 */
221 writel(next_task->pa_base >> cmdq->shift_pa,
222 thread->base + CMDQ_THR_CURR_ADDR);
223 cmdq_thread_resume(thread);
/*
 * Per-thread interrupt work: read and write back the thread's IRQ flags,
 * complete every task the hardware has moved past, handle an error on the
 * current task, and disable the thread when nothing is left.
 * @cmdq: controller.
 * @thread: thread to service.
 *
 * Both callers in this file hold thread->chan->lock around the call.
 * Several control-flow lines (returns, else branches, the error flag) are
 * not visible in this excerpt.
 */
226 static void cmdq_thread_irq_handler(struct cmdq *cmdq,
227 struct cmdq_thread *thread)
229 struct cmdq_task *task, *tmp, *curr_task = NULL;
230 u32 curr_pa, irq_flag, task_end_pa;
/*
 * Read the pending flags, then write their complement back.
 * NOTE(review): presumably writing 0 to a bit clears it - confirm.
 */
233 irq_flag = readl(thread->base + CMDQ_THR_IRQ_STATUS);
234 writel(~irq_flag, thread->base + CMDQ_THR_IRQ_STATUS);
237 * When ISR call this function, another CPU core could run
238 * "release task" right before we acquire the spin lock, and thus
239 * reset / disable this GCE thread, so we need to check the enable
240 * bit of this GCE thread.
242 if (!(readl(thread->base + CMDQ_THR_ENABLE_TASK) & CMDQ_THR_ENABLED))
/* Classify the interrupt; the error flag takes precedence over done. */
245 if (irq_flag & CMDQ_THR_IRQ_ERROR)
247 else if (irq_flag & CMDQ_THR_IRQ_DONE)
/* Convert the register value back to an unshifted physical address. */
252 curr_pa = readl(thread->base + CMDQ_THR_CURR_ADDR) << cmdq->shift_pa;
/* Walk tasks in queue order; the _safe variant allows unlinking while iterating. */
254 list_for_each_entry_safe(task, tmp, &thread->task_busy_list,
256 task_end_pa = task->pa_base + task->pkt->cmd_buf_size;
/* Does the program counter lie inside this task's buffer? */
257 if (curr_pa >= task->pa_base && curr_pa < task_end_pa)
/*
 * The task is complete if the PC is not inside it, or if the PC sits on
 * its last instruction.
 */
260 if (!curr_task || curr_pa == task_end_pa - CMDQ_INST_SIZE) {
261 cmdq_task_exec_done(task, 0);
/*
 * Error path: fail the task with -ENOEXEC and restart the thread.
 * NOTE(review): the condition guarding this path is not visible here.
 */
264 cmdq_task_exec_done(task, -ENOEXEC);
265 cmdq_task_handle_error(curr_task);
/* Nothing left to run: stop the thread and drop the clock enable. */
273 if (list_empty(&thread->task_busy_list)) {
274 cmdq_thread_disable(cmdq, thread);
275 clk_bulk_disable(cmdq->gce_num, cmdq->clocks);
/*
 * Top-level interrupt handler registered in cmdq_probe().
 * @irq: interrupt number (not used in the visible code).
 * @dev: the struct cmdq passed at registration.
 *
 * A thread is serviced when its bit in CMDQ_CURR_IRQ_STATUS reads as 0.
 * The return statements are not visible in this excerpt.
 */
279 static irqreturn_t cmdq_irq_handler(int irq, void *dev)
281 struct cmdq *cmdq = dev;
282 unsigned long irq_status, flags = 0L;
/* Keep only the bits that correspond to existing threads. */
285 irq_status = readl(cmdq->base + CMDQ_CURR_IRQ_STATUS) & cmdq->irq_mask;
/* All masked bits set means no thread has a zero bit, so nothing to service. */
286 if (!(irq_status ^ cmdq->irq_mask))
/* Visit every thread whose status bit is clear. */
289 for_each_clear_bit(bit, &irq_status, cmdq->thread_nr) {
290 struct cmdq_thread *thread = &cmdq->thread[bit];
/* The per-channel lock serializes against send_data, shutdown and flush. */
292 spin_lock_irqsave(&thread->chan->lock, flags);
293 cmdq_thread_irq_handler(cmdq, thread);
294 spin_unlock_irqrestore(&thread->chan->lock, flags);
/*
 * System suspend callback: mark the controller suspended, look for threads
 * that still have queued tasks, and unprepare the clocks.
 * @dev: the platform device's struct device.
 *
 * The return statement is not visible in this excerpt.
 */
300 static int cmdq_suspend(struct device *dev)
302 struct cmdq *cmdq = dev_get_drvdata(dev);
303 struct cmdq_thread *thread;
305 bool task_running = false;
/* cmdq_mbox_send_data() warns if a client submits while this is set. */
307 cmdq->suspended = true;
/* Scan all threads for a non-empty busy list. */
309 for (i = 0; i < cmdq->thread_nr; i++) {
310 thread = &cmdq->thread[i];
311 if (!list_empty(&thread->task_busy_list)) {
/* NOTE(review): the condition guarding this warning is not visible here. */
318 dev_warn(dev, "exist running task(s) in suspend\n");
/* Balances the clk_bulk_prepare() done in cmdq_probe() / cmdq_resume(). */
320 clk_bulk_unprepare(cmdq->gce_num, cmdq->clocks);
/*
 * System resume callback: prepare the clocks again and clear the suspended
 * flag. A prepare failure only triggers a warning.
 * @dev: the platform device's struct device.
 *
 * The return statement is not visible in this excerpt.
 */
325 static int cmdq_resume(struct device *dev)
327 struct cmdq *cmdq = dev_get_drvdata(dev);
329 WARN_ON(clk_bulk_prepare(cmdq->gce_num, cmdq->clocks));
330 cmdq->suspended = false;
/*
 * Platform driver remove callback: unprepare the clocks that cmdq_probe()
 * prepared. No other teardown is visible in this function.
 * @pdev: platform device being removed.
 */
334 static int cmdq_remove(struct platform_device *pdev)
336 struct cmdq *cmdq = platform_get_drvdata(pdev);
338 clk_bulk_unprepare(cmdq->gce_num, cmdq->clocks);
/*
 * Mailbox .send_data callback: wrap the client's packet in a task and
 * either start the thread with it (idle thread) or chain it behind the
 * tasks already queued (busy thread).
 * @chan: mailbox channel; chan->con_priv is the cmdq_thread.
 * @data: struct cmdq_pkt supplied by the client.
 *
 * The allocation uses GFP_ATOMIC. The allocation failure check, the else
 * branches and the return statements are on lines not visible in this
 * excerpt.
 */
342 static int cmdq_mbox_send_data(struct mbox_chan *chan, void *data)
344 struct cmdq_pkt *pkt = (struct cmdq_pkt *)data;
345 struct cmdq_thread *thread = (struct cmdq_thread *)chan->con_priv;
346 struct cmdq *cmdq = dev_get_drvdata(chan->mbox->dev);
347 struct cmdq_task *task;
348 unsigned long curr_pa, end_pa;
350 /* Client should not flush new tasks if suspended. */
351 WARN_ON(cmdq->suspended);
353 task = kzalloc(sizeof(*task), GFP_ATOMIC);
358 INIT_LIST_HEAD(&task->list_entry);
359 task->pa_base = pkt->pa_base;
360 task->thread = thread;
/* Idle thread: enable clocks, reset, program registers and start. */
363 if (list_empty(&thread->task_busy_list)) {
364 WARN_ON(clk_bulk_enable(cmdq->gce_num, cmdq->clocks));
367 * The thread reset will clear thread related register to 0,
368 * including pc, end, priority, irq, suspend and enable. Thus
369 * set CMDQ_THR_ENABLED to CMDQ_THR_ENABLE_TASK will enable
370 * thread and make it running.
372 WARN_ON(cmdq_thread_reset(cmdq, thread) < 0);
/* Program counter and end address are written in shifted form. */
374 writel(task->pa_base >> cmdq->shift_pa,
375 thread->base + CMDQ_THR_CURR_ADDR);
376 writel((task->pa_base + pkt->cmd_buf_size) >> cmdq->shift_pa,
377 thread->base + CMDQ_THR_END_ADDR);
/* The priority comes from the device tree argument stored by cmdq_xlate(). */
379 writel(thread->priority, thread->base + CMDQ_THR_PRIORITY);
380 writel(CMDQ_THR_IRQ_EN, thread->base + CMDQ_THR_IRQ_ENABLE);
381 writel(CMDQ_THR_ENABLED, thread->base + CMDQ_THR_ENABLE_TASK);
/*
 * Busy thread: suspend it so that its PC and END can be sampled and
 * updated consistently.
 * NOTE(review): the else keyword separating this path from the idle path
 * is on a line not visible in this excerpt.
 */
383 WARN_ON(cmdq_thread_suspend(cmdq, thread) < 0);
384 curr_pa = readl(thread->base + CMDQ_THR_CURR_ADDR) <<
386 end_pa = readl(thread->base + CMDQ_THR_END_ADDR) <<
/*
 * If the PC is on the last instruction before END (a second condition is
 * on a line not visible here), point the PC at the new task directly.
 */
389 if (curr_pa == end_pa - CMDQ_INST_SIZE ||
391 /* set to this task directly */
392 writel(task->pa_base >> cmdq->shift_pa,
393 thread->base + CMDQ_THR_CURR_ADDR);
/* Otherwise patch the previous task so that it jumps to the new one. */
395 cmdq_task_insert_into_thread(task);
396 smp_mb(); /* modify jump before enable thread */
/* Extend END to cover the new task, then let the thread run again. */
398 writel((task->pa_base + pkt->cmd_buf_size) >> cmdq->shift_pa,
399 thread->base + CMDQ_THR_END_ADDR);
400 cmdq_thread_resume(thread);
/* Queue the task at the tail of the thread's busy list. */
402 list_move_tail(&task->list_entry, &thread->task_busy_list);
/*
 * Mailbox .startup callback (installed in cmdq_mbox_chan_ops).
 * NOTE(review): the body is not visible in this excerpt.
 */
407 static int cmdq_mbox_startup(struct mbox_chan *chan)
/*
 * Mailbox .shutdown callback: under the channel lock, complete the tasks
 * the hardware has already finished, abort the remaining ones with
 * -ECONNABORTED, then disable the thread and its clocks.
 * @chan: mailbox channel; chan->con_priv is the cmdq_thread.
 *
 * The goto/label lines that skip to the unlock are not visible in this
 * excerpt.
 */
412 static void cmdq_mbox_shutdown(struct mbox_chan *chan)
414 struct cmdq_thread *thread = (struct cmdq_thread *)chan->con_priv;
415 struct cmdq *cmdq = dev_get_drvdata(chan->mbox->dev);
416 struct cmdq_task *task, *tmp;
419 spin_lock_irqsave(&thread->chan->lock, flags);
/* Nothing queued: see the explanation before the unlock below. */
420 if (list_empty(&thread->task_busy_list))
/* Stop the hardware before inspecting its progress. */
423 WARN_ON(cmdq_thread_suspend(cmdq, thread) < 0);
425 /* make sure executed tasks have success callback */
426 cmdq_thread_irq_handler(cmdq, thread);
/* The handler may have drained the list and already disabled the thread. */
427 if (list_empty(&thread->task_busy_list))
/* Abort whatever is still queued. */
430 list_for_each_entry_safe(task, tmp, &thread->task_busy_list,
432 cmdq_task_exec_done(task, -ECONNABORTED);
436 cmdq_thread_disable(cmdq, thread);
437 clk_bulk_disable(cmdq->gce_num, cmdq->clocks);
/* NOTE(review): the word statue in the text below is a typo for status. */
441 * The thread->task_busy_list empty means thread already disable. The
442 * cmdq_mbox_send_data() always reset thread which clear disable and
443 * suspend statue when first pkt send to channel, so there is no need
444 * to do any operation here, only unlock and leave.
446 spin_unlock_irqrestore(&thread->chan->lock, flags);
/*
 * Mailbox .flush callback. Two paths are visible: abort all queued tasks
 * and disable the thread, or resume the thread and poll until it disables
 * itself.
 * @chan: mailbox channel; chan->con_priv is the cmdq_thread.
 * @timeout: passed as the timeout argument of the final register poll.
 *
 * The goto/label lines and return statements are not visible in this
 * excerpt.
 */
449 static int cmdq_mbox_flush(struct mbox_chan *chan, unsigned long timeout)
451 struct cmdq_thread *thread = (struct cmdq_thread *)chan->con_priv;
452 struct cmdq_task_cb *cb;
453 struct cmdq_cb_data data;
454 struct cmdq *cmdq = dev_get_drvdata(chan->mbox->dev);
455 struct cmdq_task *task, *tmp;
459 spin_lock_irqsave(&thread->chan->lock, flags);
/* Nothing queued, so nothing to flush. */
460 if (list_empty(&thread->task_busy_list))
463 WARN_ON(cmdq_thread_suspend(cmdq, thread) < 0);
/*
 * NOTE(review): presumably a thread that is not waiting on an event is
 * sent to the wait path at the end of the function - the branch target is
 * not visible here.
 */
464 if (!cmdq_thread_is_in_wfe(thread))
/* Abort path: report -ECONNABORTED for every queued task and unlink it. */
467 list_for_each_entry_safe(task, tmp, &thread->task_busy_list,
469 cb = &task->pkt->async_cb;
470 data.sta = -ECONNABORTED;
471 data.data = cb->data;
472 data.pkt = task->pkt;
476 mbox_chan_received_data(task->thread->chan, &data);
477 list_del(&task->list_entry);
/* Leave the suspended state, then stop the thread and drop the clock enable. */
481 cmdq_thread_resume(thread);
482 cmdq_thread_disable(cmdq, thread);
483 clk_bulk_disable(cmdq->gce_num, cmdq->clocks);
486 spin_unlock_irqrestore(&thread->chan->lock, flags);
/*
 * Wait path: let the thread keep running, release the lock, and poll
 * CMDQ_THR_ENABLE_TASK until it reads 0 (1 us between reads, at most
 * @timeout us).
 */
490 cmdq_thread_resume(thread);
491 spin_unlock_irqrestore(&thread->chan->lock, flags);
492 if (readl_poll_timeout_atomic(thread->base + CMDQ_THR_ENABLE_TASK,
493 enable, enable == 0, 1, timeout)) {
494 dev_err(cmdq->mbox.dev, "Fail to wait GCE thread 0x%x done\n",
495 (u32)(thread->base - cmdq->base));
/* Mailbox channel operations; installed as cmdq->mbox.ops in cmdq_probe(). */
502 static const struct mbox_chan_ops cmdq_mbox_chan_ops = {
503 .send_data = cmdq_mbox_send_data,
504 .startup = cmdq_mbox_startup,
505 .shutdown = cmdq_mbox_shutdown,
506 .flush = cmdq_mbox_flush,
/*
 * Mailbox of_xlate callback: map a device tree mailbox specifier to a
 * channel.
 * @mbox: this driver's mailbox controller.
 * @sp: specifier; args[0] is the channel/thread index, args[1] the thread
 *      priority.
 *
 * Returns the selected channel, or ERR_PTR(-EINVAL) when the index is not
 * below mbox->num_chans. As a side effect the thread's priority and
 * back-pointer to the channel are updated.
 */
509 static struct mbox_chan *cmdq_xlate(struct mbox_controller *mbox,
510 const struct of_phandle_args *sp)
/*
 * NOTE(review): ind is a signed int and only the upper bound is checked
 * below; confirm a specifier value that converts to a negative int cannot
 * reach the array accesses.
 */
512 int ind = sp->args[0];
513 struct cmdq_thread *thread;
515 if (ind >= mbox->num_chans)
516 return ERR_PTR(-EINVAL);
/* con_priv was pointed at the matching cmdq_thread in cmdq_probe(). */
518 thread = (struct cmdq_thread *)mbox->chans[ind].con_priv;
519 thread->priority = sp->args[1];
520 thread->chan = &mbox->chans[ind];
522 return &mbox->chans[ind];
/*
 * Platform driver probe: map registers, read per-SoC match data, request
 * the interrupt, look up the GCE clock(s), allocate channels and threads,
 * register the mailbox controller and prepare the clocks.
 * @pdev: platform device being probed.
 *
 * Many short lines (error checks, returns, declarations, braces) are not
 * visible in this excerpt; the comments below describe only what is shown.
 */
525 static int cmdq_probe(struct platform_device *pdev)
527 struct device *dev = &pdev->dev;
528 struct resource *res;
531 struct gce_plat *plat_data;
532 struct device_node *phandle = dev->of_node;
533 struct device_node *node;
/*
 * NOTE(review): clk_name is a stack array, yet its address is stored in
 * cmdq->clocks[].id further down, and cmdq outlives this function. Any
 * later reader of .id would see a dangling pointer - confirm and consider
 * static storage. The same applies to clk_id if it is also a stack buffer
 * (its declaration is not visible here).
 */
535 char clk_name[4] = "gce";
/* Device-managed allocation: freed automatically when the device is unbound. */
537 cmdq = devm_kzalloc(dev, sizeof(*cmdq), GFP_KERNEL);
/* Map the first memory resource as the controller register base. */
541 res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
542 cmdq->base = devm_ioremap_resource(dev, res);
543 if (IS_ERR(cmdq->base))
544 return PTR_ERR(cmdq->base);
546 cmdq->irq = platform_get_irq(pdev, 0);
/* Per-SoC parameters come from the matching cmdq_of_ids entry. */
550 plat_data = (struct gce_plat *)of_device_get_match_data(dev);
552 dev_err(dev, "failed to get match data\n");
556 cmdq->thread_nr = plat_data->thread_nr;
557 cmdq->shift_pa = plat_data->shift;
558 cmdq->control_by_sw = plat_data->control_by_sw;
559 cmdq->gce_num = plat_data->gce_num;
/* One mask bit per thread, bits 0 .. thread_nr - 1. */
560 cmdq->irq_mask = GENMASK(cmdq->thread_nr - 1, 0);
561 err = devm_request_irq(dev, cmdq->irq, cmdq_irq_handler, IRQF_SHARED,
564 dev_err(dev, "failed to register ISR (%d)\n", err);
568 dev_dbg(dev, "cmdq device: addr:0x%p, va:0x%p, irq:%d\n",
569 dev, cmdq->base, cmdq->irq);
/*
 * With more than one GCE, take one clock from each sibling node whose
 * "gce" alias id is below gce_num; otherwise take this device's "gce"
 * clock.
 */
571 if (cmdq->gce_num > 1) {
572 for_each_child_of_node(phandle->parent, node) {
/*
 * NOTE(review): of_alias_get_id() can return a negative errno, and only
 * the upper bound is checked before alias_id indexes clocks[] - confirm a
 * lower-bound check exists on an omitted line.
 */
575 alias_id = of_alias_get_id(node, clk_name);
576 if (alias_id < cmdq->gce_num) {
577 snprintf(clk_id, sizeof(clk_id), "%s%d", clk_name, alias_id);
578 cmdq->clocks[alias_id].id = clk_id;
579 cmdq->clocks[alias_id].clk = of_clk_get(node, 0);
580 if (IS_ERR(cmdq->clocks[alias_id].clk)) {
581 dev_err(dev, "failed to get gce clk: %d\n", alias_id);
/*
 * NOTE(review): returning from inside for_each_child_of_node() normally
 * requires of_node_put(node) first - confirm.
 */
582 return PTR_ERR(cmdq->clocks[alias_id].clk);
/* Single-GCE case. NOTE(review): the value of alias_id on this path is not visible here. */
587 cmdq->clocks[alias_id].id = clk_name;
588 cmdq->clocks[alias_id].clk = devm_clk_get(&pdev->dev, clk_name);
589 if (IS_ERR(cmdq->clocks[alias_id].clk)) {
590 dev_err(dev, "failed to get gce clk\n");
591 return PTR_ERR(cmdq->clocks[alias_id].clk);
/* Mailbox controller setup: one channel per GCE thread. */
595 cmdq->mbox.dev = dev;
596 cmdq->mbox.chans = devm_kcalloc(dev, cmdq->thread_nr,
597 sizeof(*cmdq->mbox.chans), GFP_KERNEL);
598 if (!cmdq->mbox.chans)
601 cmdq->mbox.num_chans = cmdq->thread_nr;
602 cmdq->mbox.ops = &cmdq_mbox_chan_ops;
603 cmdq->mbox.of_xlate = cmdq_xlate;
605 /* make use of TXDONE_BY_ACK */
606 cmdq->mbox.txdone_irq = false;
607 cmdq->mbox.txdone_poll = false;
609 cmdq->thread = devm_kcalloc(dev, cmdq->thread_nr,
610 sizeof(*cmdq->thread), GFP_KERNEL);
/*
 * Give each thread its register base and an empty busy list, and link the
 * channel to it through con_priv.
 */
614 for (i = 0; i < cmdq->thread_nr; i++) {
615 cmdq->thread[i].base = cmdq->base + CMDQ_THR_BASE +
617 INIT_LIST_HEAD(&cmdq->thread[i].task_busy_list);
618 cmdq->mbox.chans[i].con_priv = (void *)&cmdq->thread[i];
621 err = devm_mbox_controller_register(dev, &cmdq->mbox);
623 dev_err(dev, "failed to register mailbox: %d\n", err);
/* Make the state reachable from the PM and remove callbacks. */
627 platform_set_drvdata(pdev, cmdq);
/* Clocks stay prepared from here on; enable/disable happens per use. */
629 WARN_ON(clk_bulk_prepare(cmdq->gce_num, cmdq->clocks));
/* Power-management callbacks: system suspend and resume handlers of this driver. */
636 static const struct dev_pm_ops cmdq_pm_ops = {
637 .suspend = cmdq_suspend,
638 .resume = cmdq_resume,
/*
 * Per-SoC parameter sets referenced from cmdq_of_ids. cmdq_probe() copies
 * thread_nr, shift, control_by_sw and gce_num out of the matching entry.
 * Only the control_by_sw initializers are visible in this excerpt; of the
 * five sets, only gce_plat_v5 sets it to true.
 */
641 static const struct gce_plat gce_plat_v2 = {
644 .control_by_sw = false,
648 static const struct gce_plat gce_plat_v3 = {
651 .control_by_sw = false,
655 static const struct gce_plat gce_plat_v4 = {
658 .control_by_sw = false,
/* The only variant for which cmdq_init() writes GCE_GCTL_VALUE. */
662 static const struct gce_plat gce_plat_v5 = {
665 .control_by_sw = true,
669 static const struct gce_plat gce_plat_v6 = {
672 .control_by_sw = false,
/*
 * Device tree match table: each compatible string selects the gce_plat
 * parameter set that cmdq_probe() retrieves as match data.
 */
676 static const struct of_device_id cmdq_of_ids[] = {
677 {.compatible = "mediatek,mt8173-gce", .data = (void *)&gce_plat_v2},
678 {.compatible = "mediatek,mt8183-gce", .data = (void *)&gce_plat_v3},
679 {.compatible = "mediatek,mt6779-gce", .data = (void *)&gce_plat_v4},
680 {.compatible = "mediatek,mt8192-gce", .data = (void *)&gce_plat_v5},
681 {.compatible = "mediatek,mt8195-gce", .data = (void *)&gce_plat_v6},
/*
 * Platform driver description registered in cmdq_drv_init(). Only the
 * remove callback and the match table are visible in this excerpt; the
 * remaining initializers are on omitted lines.
 */
685 static struct platform_driver cmdq_drv = {
687 .remove = cmdq_remove,
691 .of_match_table = cmdq_of_ids,
/* Init entry point: register the platform driver and return the result. */
695 static int __init cmdq_drv_init(void)
697 return platform_driver_register(&cmdq_drv);
/* Exit entry point: unregister the platform driver. */
700 static void __exit cmdq_drv_exit(void)
702 platform_driver_unregister(&cmdq_drv);
/*
 * The driver is registered through subsys_initcall() rather than
 * module_init(); cmdq_drv_exit() is the module exit handler.
 */
705 subsys_initcall(cmdq_drv_init);
706 module_exit(cmdq_drv_exit);
708 MODULE_LICENSE("GPL v2");