1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 * Copyright (c) 2016 MediaTek Inc.
4 * Author: Andrew-CT Chen <andrew-ct.chen@mediatek.com>
5 */
6 #include <linux/clk.h>
7 #include <linux/debugfs.h>
8 #include <linux/firmware.h>
9 #include <linux/interrupt.h>
10 #include <linux/iommu.h>
11 #include <linux/module.h>
12 #include <linux/of_address.h>
13 #include <linux/of_irq.h>
14 #include <linux/of_platform.h>
15 #include <linux/of_reserved_mem.h>
16 #include <linux/sched.h>
17 #include <linux/sizes.h>
18 #include <linux/dma-mapping.h>
19
20 #include "mtk_vpu.h"
21
22 /*
23 * VPU (video processor unit) is a tiny processor controlling video hardware
24 * related to video codec, scaling and color format converting.
25 * VPU interfaces with other blocks by share memory and interrupt.
26 */
27
28 #define INIT_TIMEOUT_MS 2000U
29 #define IPI_TIMEOUT_MS 2000U
30 #define VPU_IDLE_TIMEOUT_MS 1000U
31 #define VPU_FW_VER_LEN 16
32
33 /* maximum program/data TCM (Tightly-Coupled Memory) size */
34 #define VPU_PTCM_SIZE (96 * SZ_1K)
35 #define VPU_DTCM_SIZE (32 * SZ_1K)
36 /* the offset to get data tcm address */
37 #define VPU_DTCM_OFFSET 0x18000UL
38 /* daynamic allocated maximum extended memory size */
39 #define VPU_EXT_P_SIZE SZ_1M
40 #define VPU_EXT_D_SIZE SZ_4M
41 /* maximum binary firmware size */
42 #define VPU_P_FW_SIZE (VPU_PTCM_SIZE + VPU_EXT_P_SIZE)
43 #define VPU_D_FW_SIZE (VPU_DTCM_SIZE + VPU_EXT_D_SIZE)
44 /* the size of share buffer between Host and VPU */
45 #define SHARE_BUF_SIZE 48
46
47 /* binary firmware name */
48 #define VPU_P_FW "vpu_p.bin"
49 #define VPU_D_FW "vpu_d.bin"
50 #define VPU_P_FW_NEW "mediatek/mt8173/vpu_p.bin"
51 #define VPU_D_FW_NEW "mediatek/mt8173/vpu_d.bin"
52
53 #define VPU_RESET 0x0
54 #define VPU_TCM_CFG 0x0008
55 #define VPU_PMEM_EXT0_ADDR 0x000C
56 #define VPU_PMEM_EXT1_ADDR 0x0010
57 #define VPU_TO_HOST 0x001C
58 #define VPU_DMEM_EXT0_ADDR 0x0014
59 #define VPU_DMEM_EXT1_ADDR 0x0018
60 #define HOST_TO_VPU 0x0024
61 #define VPU_IDLE_REG 0x002C
62 #define VPU_INT_STATUS 0x0034
63 #define VPU_PC_REG 0x0060
64 #define VPU_SP_REG 0x0064
65 #define VPU_RA_REG 0x0068
66 #define VPU_WDT_REG 0x0084
67
68 /* vpu inter-processor communication interrupt */
69 #define VPU_IPC_INT BIT(8)
70 /* vpu idle state */
71 #define VPU_IDLE_STATE BIT(23)
72
73 /**
74 * enum vpu_fw_type - VPU firmware type
75 *
76 * @P_FW: program firmware
77 * @D_FW: data firmware
78 *
79 */
80 enum vpu_fw_type {
81 P_FW,
82 D_FW,
83 };
84
85 /**
86 * struct vpu_mem - VPU extended program/data memory information
87 *
88 * @va: the kernel virtual memory address of VPU extended memory
89 * @pa: the physical memory address of VPU extended memory
90 *
91 */
92 struct vpu_mem {
93 void *va;
94 dma_addr_t pa;
95 };
96
97 /**
98 * struct vpu_regs - VPU TCM and configuration registers
99 *
100 * @tcm: the register for VPU Tightly-Coupled Memory
101 * @cfg: the register for VPU configuration
102 * @irq: the irq number for VPU interrupt
103 */
104 struct vpu_regs {
105 void __iomem *tcm;
106 void __iomem *cfg;
107 int irq;
108 };
109
110 /**
111 * struct vpu_wdt_handler - VPU watchdog reset handler
112 *
113 * @reset_func: reset handler
114 * @priv: private data
115 */
116 struct vpu_wdt_handler {
117 void (*reset_func)(void *);
118 void *priv;
119 };
120
121 /**
122 * struct vpu_wdt - VPU watchdog workqueue
123 *
124 * @handler: VPU watchdog reset handler
125 * @ws: workstruct for VPU watchdog
126 * @wq: workqueue for VPU watchdog
127 */
128 struct vpu_wdt {
129 struct vpu_wdt_handler handler[VPU_RST_MAX];
130 struct work_struct ws;
131 struct workqueue_struct *wq;
132 };
133
134 /**
135 * struct vpu_run - VPU initialization status
136 *
137 * @signaled: the signal of vpu initialization completed
138 * @fw_ver: VPU firmware version
139 * @dec_capability: decoder capability which is not used for now and
140 * the value is reserved for future use
141 * @enc_capability: encoder capability which is not used for now and
142 * the value is reserved for future use
143 * @wq: wait queue for VPU initialization status
144 */
145 struct vpu_run {
146 u32 signaled;
147 char fw_ver[VPU_FW_VER_LEN];
148 unsigned int dec_capability;
149 unsigned int enc_capability;
150 wait_queue_head_t wq;
151 };
152
153 /**
154 * struct vpu_ipi_desc - VPU IPI descriptor
155 *
156 * @handler: IPI handler
157 * @name: the name of IPI handler
158 * @priv: the private data of IPI handler
159 */
160 struct vpu_ipi_desc {
161 ipi_handler_t handler;
162 const char *name;
163 void *priv;
164 };
165
166 /**
167 * struct share_obj - DTCM (Data Tightly-Coupled Memory) buffer shared with
168 * AP and VPU
169 *
170 * @id: IPI id
171 * @len: share buffer length
172 * @share_buf: share buffer data
173 */
174 struct share_obj {
175 s32 id;
176 u32 len;
177 unsigned char share_buf[SHARE_BUF_SIZE];
178 };
179
180 /**
181 * struct mtk_vpu - vpu driver data
182 * @extmem: VPU extended memory information
183 * @reg: VPU TCM and configuration registers
184 * @run: VPU initialization status
185 * @wdt: VPU watchdog workqueue
186 * @ipi_desc: VPU IPI descriptor
187 * @recv_buf: VPU DTCM share buffer for receiving. The
188 * receive buffer is only accessed in interrupt context.
189 * @send_buf: VPU DTCM share buffer for sending
190 * @dev: VPU struct device
191 * @clk: VPU clock on/off
192 * @fw_loaded: indicate VPU firmware loaded
193 * @enable_4GB: VPU 4GB mode on/off
194 * @vpu_mutex: protect mtk_vpu (except recv_buf) and ensure only
195 * one client to use VPU service at a time. For example,
196 * suppose a client is using VPU to decode VP8.
197 * If the other client wants to encode VP8,
198 * it has to wait until VP8 decode completes.
199 * @wdt_refcnt: WDT reference count to make sure the watchdog can be
200 * disabled if no other client is using VPU service
201 * @ack_wq: The wait queue for each codec and mdp. When sleeping
202 * processes wake up, they will check the condition
203 * "ipi_id_ack" to run the corresponding action or
204 * go back to sleep.
205 * @ipi_id_ack: The ACKs for registered IPI function sending
206 * interrupt to VPU
207 *
208 */
209 struct mtk_vpu {
210 struct vpu_mem extmem[2];
211 struct vpu_regs reg;
212 struct vpu_run run;
213 struct vpu_wdt wdt;
214 struct vpu_ipi_desc ipi_desc[IPI_MAX];
215 struct share_obj __iomem *recv_buf;
216 struct share_obj __iomem *send_buf;
217 struct device *dev;
218 struct clk *clk;
219 bool fw_loaded;
220 bool enable_4GB;
221 struct mutex vpu_mutex; /* for protecting vpu data data structure */
222 u32 wdt_refcnt;
223 wait_queue_head_t ack_wq;
224 bool ipi_id_ack[IPI_MAX];
225 };
226
vpu_cfg_writel(struct mtk_vpu * vpu,u32 val,u32 offset)227 static inline void vpu_cfg_writel(struct mtk_vpu *vpu, u32 val, u32 offset)
228 {
229 writel(val, vpu->reg.cfg + offset);
230 }
231
vpu_cfg_readl(struct mtk_vpu * vpu,u32 offset)232 static inline u32 vpu_cfg_readl(struct mtk_vpu *vpu, u32 offset)
233 {
234 return readl(vpu->reg.cfg + offset);
235 }
236
vpu_running(struct mtk_vpu * vpu)237 static inline bool vpu_running(struct mtk_vpu *vpu)
238 {
239 return vpu_cfg_readl(vpu, VPU_RESET) & BIT(0);
240 }
241
vpu_clock_disable(struct mtk_vpu * vpu)242 static void vpu_clock_disable(struct mtk_vpu *vpu)
243 {
244 /* Disable VPU watchdog */
245 mutex_lock(&vpu->vpu_mutex);
246 if (!--vpu->wdt_refcnt)
247 vpu_cfg_writel(vpu,
248 vpu_cfg_readl(vpu, VPU_WDT_REG) & ~(1L << 31),
249 VPU_WDT_REG);
250 mutex_unlock(&vpu->vpu_mutex);
251
252 clk_disable(vpu->clk);
253 }
254
vpu_clock_enable(struct mtk_vpu * vpu)255 static int vpu_clock_enable(struct mtk_vpu *vpu)
256 {
257 int ret;
258
259 ret = clk_enable(vpu->clk);
260 if (ret)
261 return ret;
262 /* Enable VPU watchdog */
263 mutex_lock(&vpu->vpu_mutex);
264 if (!vpu->wdt_refcnt++)
265 vpu_cfg_writel(vpu,
266 vpu_cfg_readl(vpu, VPU_WDT_REG) | (1L << 31),
267 VPU_WDT_REG);
268 mutex_unlock(&vpu->vpu_mutex);
269
270 return ret;
271 }
272
vpu_dump_status(struct mtk_vpu * vpu)273 static void vpu_dump_status(struct mtk_vpu *vpu)
274 {
275 dev_info(vpu->dev,
276 "vpu: run %x, pc = 0x%x, ra = 0x%x, sp = 0x%x, idle = 0x%x\n"
277 "vpu: int %x, hv = 0x%x, vh = 0x%x, wdt = 0x%x\n",
278 vpu_running(vpu), vpu_cfg_readl(vpu, VPU_PC_REG),
279 vpu_cfg_readl(vpu, VPU_RA_REG), vpu_cfg_readl(vpu, VPU_SP_REG),
280 vpu_cfg_readl(vpu, VPU_IDLE_REG),
281 vpu_cfg_readl(vpu, VPU_INT_STATUS),
282 vpu_cfg_readl(vpu, HOST_TO_VPU),
283 vpu_cfg_readl(vpu, VPU_TO_HOST),
284 vpu_cfg_readl(vpu, VPU_WDT_REG));
285 }
286
vpu_ipi_register(struct platform_device * pdev,enum ipi_id id,ipi_handler_t handler,const char * name,void * priv)287 int vpu_ipi_register(struct platform_device *pdev,
288 enum ipi_id id, ipi_handler_t handler,
289 const char *name, void *priv)
290 {
291 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
292 struct vpu_ipi_desc *ipi_desc;
293
294 if (!vpu) {
295 dev_err(&pdev->dev, "vpu device in not ready\n");
296 return -EPROBE_DEFER;
297 }
298
299 if (id < IPI_MAX && handler) {
300 ipi_desc = vpu->ipi_desc;
301 ipi_desc[id].name = name;
302 ipi_desc[id].handler = handler;
303 ipi_desc[id].priv = priv;
304 return 0;
305 }
306
307 dev_err(&pdev->dev, "register vpu ipi id %d with invalid arguments\n",
308 id);
309 return -EINVAL;
310 }
311 EXPORT_SYMBOL_GPL(vpu_ipi_register);
312
vpu_ipi_send(struct platform_device * pdev,enum ipi_id id,void * buf,unsigned int len)313 int vpu_ipi_send(struct platform_device *pdev,
314 enum ipi_id id, void *buf,
315 unsigned int len)
316 {
317 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
318 struct share_obj __iomem *send_obj = vpu->send_buf;
319 unsigned long timeout;
320 int ret = 0;
321
322 if (id <= IPI_VPU_INIT || id >= IPI_MAX ||
323 len > sizeof(send_obj->share_buf) || !buf) {
324 dev_err(vpu->dev, "failed to send ipi message\n");
325 return -EINVAL;
326 }
327
328 ret = vpu_clock_enable(vpu);
329 if (ret) {
330 dev_err(vpu->dev, "failed to enable vpu clock\n");
331 return ret;
332 }
333 if (!vpu_running(vpu)) {
334 dev_err(vpu->dev, "vpu_ipi_send: VPU is not running\n");
335 ret = -EINVAL;
336 goto clock_disable;
337 }
338
339 mutex_lock(&vpu->vpu_mutex);
340
341 /* Wait until VPU receives the last command */
342 timeout = jiffies + msecs_to_jiffies(IPI_TIMEOUT_MS);
343 do {
344 if (time_after(jiffies, timeout)) {
345 dev_err(vpu->dev, "vpu_ipi_send: IPI timeout!\n");
346 ret = -EIO;
347 vpu_dump_status(vpu);
348 goto mut_unlock;
349 }
350 } while (vpu_cfg_readl(vpu, HOST_TO_VPU));
351
352 memcpy_toio(send_obj->share_buf, buf, len);
353 writel(len, &send_obj->len);
354 writel(id, &send_obj->id);
355
356 vpu->ipi_id_ack[id] = false;
357 /* send the command to VPU */
358 vpu_cfg_writel(vpu, 0x1, HOST_TO_VPU);
359
360 mutex_unlock(&vpu->vpu_mutex);
361
362 /* wait for VPU's ACK */
363 timeout = msecs_to_jiffies(IPI_TIMEOUT_MS);
364 ret = wait_event_timeout(vpu->ack_wq, vpu->ipi_id_ack[id], timeout);
365 vpu->ipi_id_ack[id] = false;
366 if (ret == 0) {
367 dev_err(vpu->dev, "vpu ipi %d ack time out !\n", id);
368 ret = -EIO;
369 vpu_dump_status(vpu);
370 goto clock_disable;
371 }
372 vpu_clock_disable(vpu);
373
374 return 0;
375
376 mut_unlock:
377 mutex_unlock(&vpu->vpu_mutex);
378 clock_disable:
379 vpu_clock_disable(vpu);
380
381 return ret;
382 }
383 EXPORT_SYMBOL_GPL(vpu_ipi_send);
384
vpu_wdt_reset_func(struct work_struct * ws)385 static void vpu_wdt_reset_func(struct work_struct *ws)
386 {
387 struct vpu_wdt *wdt = container_of(ws, struct vpu_wdt, ws);
388 struct mtk_vpu *vpu = container_of(wdt, struct mtk_vpu, wdt);
389 struct vpu_wdt_handler *handler = wdt->handler;
390 int index, ret;
391
392 dev_info(vpu->dev, "vpu reset\n");
393 ret = vpu_clock_enable(vpu);
394 if (ret) {
395 dev_err(vpu->dev, "[VPU] wdt enables clock failed %d\n", ret);
396 return;
397 }
398 mutex_lock(&vpu->vpu_mutex);
399 vpu_cfg_writel(vpu, 0x0, VPU_RESET);
400 vpu->fw_loaded = false;
401 mutex_unlock(&vpu->vpu_mutex);
402 vpu_clock_disable(vpu);
403
404 for (index = 0; index < VPU_RST_MAX; index++) {
405 if (handler[index].reset_func) {
406 handler[index].reset_func(handler[index].priv);
407 dev_dbg(vpu->dev, "wdt handler func %d\n", index);
408 }
409 }
410 }
411
vpu_wdt_reg_handler(struct platform_device * pdev,void wdt_reset (void *),void * priv,enum rst_id id)412 int vpu_wdt_reg_handler(struct platform_device *pdev,
413 void wdt_reset(void *),
414 void *priv, enum rst_id id)
415 {
416 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
417 struct vpu_wdt_handler *handler;
418
419 if (!vpu) {
420 dev_err(&pdev->dev, "vpu device in not ready\n");
421 return -EPROBE_DEFER;
422 }
423
424 handler = vpu->wdt.handler;
425
426 if (id < VPU_RST_MAX && wdt_reset) {
427 dev_dbg(vpu->dev, "wdt register id %d\n", id);
428 mutex_lock(&vpu->vpu_mutex);
429 handler[id].reset_func = wdt_reset;
430 handler[id].priv = priv;
431 mutex_unlock(&vpu->vpu_mutex);
432 return 0;
433 }
434
435 dev_err(vpu->dev, "register vpu wdt handler failed\n");
436 return -EINVAL;
437 }
438 EXPORT_SYMBOL_GPL(vpu_wdt_reg_handler);
439
vpu_get_vdec_hw_capa(struct platform_device * pdev)440 unsigned int vpu_get_vdec_hw_capa(struct platform_device *pdev)
441 {
442 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
443
444 return vpu->run.dec_capability;
445 }
446 EXPORT_SYMBOL_GPL(vpu_get_vdec_hw_capa);
447
vpu_get_venc_hw_capa(struct platform_device * pdev)448 unsigned int vpu_get_venc_hw_capa(struct platform_device *pdev)
449 {
450 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
451
452 return vpu->run.enc_capability;
453 }
454 EXPORT_SYMBOL_GPL(vpu_get_venc_hw_capa);
455
vpu_mapping_dm_addr(struct platform_device * pdev,u32 dtcm_dmem_addr)456 void *vpu_mapping_dm_addr(struct platform_device *pdev,
457 u32 dtcm_dmem_addr)
458 {
459 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
460
461 if (!dtcm_dmem_addr ||
462 (dtcm_dmem_addr > (VPU_DTCM_SIZE + VPU_EXT_D_SIZE))) {
463 dev_err(vpu->dev, "invalid virtual data memory address\n");
464 return ERR_PTR(-EINVAL);
465 }
466
467 if (dtcm_dmem_addr < VPU_DTCM_SIZE)
468 return (__force void *)(dtcm_dmem_addr + vpu->reg.tcm +
469 VPU_DTCM_OFFSET);
470
471 return vpu->extmem[D_FW].va + (dtcm_dmem_addr - VPU_DTCM_SIZE);
472 }
473 EXPORT_SYMBOL_GPL(vpu_mapping_dm_addr);
474
vpu_get_plat_device(struct platform_device * pdev)475 struct platform_device *vpu_get_plat_device(struct platform_device *pdev)
476 {
477 struct device *dev = &pdev->dev;
478 struct device_node *vpu_node;
479 struct platform_device *vpu_pdev;
480
481 vpu_node = of_parse_phandle(dev->of_node, "mediatek,vpu", 0);
482 if (!vpu_node) {
483 dev_err(dev, "can't get vpu node\n");
484 return NULL;
485 }
486
487 vpu_pdev = of_find_device_by_node(vpu_node);
488 of_node_put(vpu_node);
489 if (WARN_ON(!vpu_pdev)) {
490 dev_err(dev, "vpu pdev failed\n");
491 return NULL;
492 }
493
494 return vpu_pdev;
495 }
496 EXPORT_SYMBOL_GPL(vpu_get_plat_device);
497
498 /* load vpu program/data memory */
load_requested_vpu(struct mtk_vpu * vpu,u8 fw_type)499 static int load_requested_vpu(struct mtk_vpu *vpu,
500 u8 fw_type)
501 {
502 size_t tcm_size = fw_type ? VPU_DTCM_SIZE : VPU_PTCM_SIZE;
503 size_t fw_size = fw_type ? VPU_D_FW_SIZE : VPU_P_FW_SIZE;
504 char *fw_name = fw_type ? VPU_D_FW : VPU_P_FW;
505 char *fw_new_name = fw_type ? VPU_D_FW_NEW : VPU_P_FW_NEW;
506 const struct firmware *vpu_fw;
507 size_t dl_size = 0;
508 size_t extra_fw_size = 0;
509 void *dest;
510 int ret;
511
512 ret = request_firmware(&vpu_fw, fw_new_name, vpu->dev);
513 if (ret < 0) {
514 dev_info(vpu->dev, "Failed to load %s, %d, retry\n",
515 fw_new_name, ret);
516
517 ret = request_firmware(&vpu_fw, fw_name, vpu->dev);
518 if (ret < 0) {
519 dev_err(vpu->dev, "Failed to load %s, %d\n", fw_name,
520 ret);
521 return ret;
522 }
523 }
524 dl_size = vpu_fw->size;
525 if (dl_size > fw_size) {
526 dev_err(vpu->dev, "fw %s size %zu is abnormal\n", fw_name,
527 dl_size);
528 release_firmware(vpu_fw);
529 return -EFBIG;
530 }
531 dev_dbg(vpu->dev, "Downloaded fw %s size: %zu.\n",
532 fw_name,
533 dl_size);
534 /* reset VPU */
535 vpu_cfg_writel(vpu, 0x0, VPU_RESET);
536
537 /* handle extended firmware size */
538 if (dl_size > tcm_size) {
539 dev_dbg(vpu->dev, "fw size %zu > limited fw size %zu\n",
540 dl_size, tcm_size);
541 extra_fw_size = dl_size - tcm_size;
542 dev_dbg(vpu->dev, "extra_fw_size %zu\n", extra_fw_size);
543 dl_size = tcm_size;
544 }
545 dest = (__force void *)vpu->reg.tcm;
546 if (fw_type == D_FW)
547 dest += VPU_DTCM_OFFSET;
548 memcpy(dest, vpu_fw->data, dl_size);
549 /* download to extended memory if need */
550 if (extra_fw_size > 0) {
551 dest = vpu->extmem[fw_type].va;
552 dev_dbg(vpu->dev, "download extended memory type %x\n",
553 fw_type);
554 memcpy(dest, vpu_fw->data + tcm_size, extra_fw_size);
555 }
556
557 release_firmware(vpu_fw);
558
559 return 0;
560 }
561
vpu_load_firmware(struct platform_device * pdev)562 int vpu_load_firmware(struct platform_device *pdev)
563 {
564 struct mtk_vpu *vpu;
565 struct device *dev = &pdev->dev;
566 struct vpu_run *run;
567 int ret;
568
569 if (!pdev) {
570 dev_err(dev, "VPU platform device is invalid\n");
571 return -EINVAL;
572 }
573
574 vpu = platform_get_drvdata(pdev);
575 run = &vpu->run;
576
577 mutex_lock(&vpu->vpu_mutex);
578 if (vpu->fw_loaded) {
579 mutex_unlock(&vpu->vpu_mutex);
580 return 0;
581 }
582 mutex_unlock(&vpu->vpu_mutex);
583
584 ret = vpu_clock_enable(vpu);
585 if (ret) {
586 dev_err(dev, "enable clock failed %d\n", ret);
587 return ret;
588 }
589
590 mutex_lock(&vpu->vpu_mutex);
591
592 run->signaled = false;
593 dev_dbg(vpu->dev, "firmware request\n");
594 /* Downloading program firmware to device*/
595 ret = load_requested_vpu(vpu, P_FW);
596 if (ret < 0) {
597 dev_err(dev, "Failed to request %s, %d\n", VPU_P_FW, ret);
598 goto OUT_LOAD_FW;
599 }
600
601 /* Downloading data firmware to device */
602 ret = load_requested_vpu(vpu, D_FW);
603 if (ret < 0) {
604 dev_err(dev, "Failed to request %s, %d\n", VPU_D_FW, ret);
605 goto OUT_LOAD_FW;
606 }
607
608 vpu->fw_loaded = true;
609 /* boot up vpu */
610 vpu_cfg_writel(vpu, 0x1, VPU_RESET);
611
612 ret = wait_event_interruptible_timeout(run->wq,
613 run->signaled,
614 msecs_to_jiffies(INIT_TIMEOUT_MS)
615 );
616 if (ret == 0) {
617 ret = -ETIME;
618 dev_err(dev, "wait vpu initialization timeout!\n");
619 goto OUT_LOAD_FW;
620 } else if (-ERESTARTSYS == ret) {
621 dev_err(dev, "wait vpu interrupted by a signal!\n");
622 goto OUT_LOAD_FW;
623 }
624
625 ret = 0;
626 dev_info(dev, "vpu is ready. Fw version %s\n", run->fw_ver);
627
628 OUT_LOAD_FW:
629 mutex_unlock(&vpu->vpu_mutex);
630 vpu_clock_disable(vpu);
631
632 return ret;
633 }
634 EXPORT_SYMBOL_GPL(vpu_load_firmware);
635
vpu_init_ipi_handler(const void * data,unsigned int len,void * priv)636 static void vpu_init_ipi_handler(const void *data, unsigned int len, void *priv)
637 {
638 struct mtk_vpu *vpu = priv;
639 const struct vpu_run *run = data;
640
641 vpu->run.signaled = run->signaled;
642 strscpy(vpu->run.fw_ver, run->fw_ver, sizeof(vpu->run.fw_ver));
643 vpu->run.dec_capability = run->dec_capability;
644 vpu->run.enc_capability = run->enc_capability;
645 wake_up_interruptible(&vpu->run.wq);
646 }
647
648 #ifdef CONFIG_DEBUG_FS
vpu_debug_read(struct file * file,char __user * user_buf,size_t count,loff_t * ppos)649 static ssize_t vpu_debug_read(struct file *file, char __user *user_buf,
650 size_t count, loff_t *ppos)
651 {
652 char buf[256];
653 unsigned int len;
654 unsigned int running, pc, vpu_to_host, host_to_vpu, wdt, idle, ra, sp;
655 int ret;
656 struct device *dev = file->private_data;
657 struct mtk_vpu *vpu = dev_get_drvdata(dev);
658
659 ret = vpu_clock_enable(vpu);
660 if (ret) {
661 dev_err(vpu->dev, "[VPU] enable clock failed %d\n", ret);
662 return 0;
663 }
664
665 /* vpu register status */
666 running = vpu_running(vpu);
667 pc = vpu_cfg_readl(vpu, VPU_PC_REG);
668 wdt = vpu_cfg_readl(vpu, VPU_WDT_REG);
669 host_to_vpu = vpu_cfg_readl(vpu, HOST_TO_VPU);
670 vpu_to_host = vpu_cfg_readl(vpu, VPU_TO_HOST);
671 ra = vpu_cfg_readl(vpu, VPU_RA_REG);
672 sp = vpu_cfg_readl(vpu, VPU_SP_REG);
673 idle = vpu_cfg_readl(vpu, VPU_IDLE_REG);
674
675 vpu_clock_disable(vpu);
676
677 if (running) {
678 len = snprintf(buf, sizeof(buf), "VPU is running\n\n"
679 "FW Version: %s\n"
680 "PC: 0x%x\n"
681 "WDT: 0x%x\n"
682 "Host to VPU: 0x%x\n"
683 "VPU to Host: 0x%x\n"
684 "SP: 0x%x\n"
685 "RA: 0x%x\n"
686 "idle: 0x%x\n",
687 vpu->run.fw_ver, pc, wdt,
688 host_to_vpu, vpu_to_host, sp, ra, idle);
689 } else {
690 len = snprintf(buf, sizeof(buf), "VPU not running\n");
691 }
692
693 return simple_read_from_buffer(user_buf, count, ppos, buf, len);
694 }
695
696 static const struct file_operations vpu_debug_fops = {
697 .open = simple_open,
698 .read = vpu_debug_read,
699 };
700 #endif /* CONFIG_DEBUG_FS */
701
vpu_free_ext_mem(struct mtk_vpu * vpu,u8 fw_type)702 static void vpu_free_ext_mem(struct mtk_vpu *vpu, u8 fw_type)
703 {
704 struct device *dev = vpu->dev;
705 size_t fw_ext_size = fw_type ? VPU_EXT_D_SIZE : VPU_EXT_P_SIZE;
706
707 dma_free_coherent(dev, fw_ext_size, vpu->extmem[fw_type].va,
708 vpu->extmem[fw_type].pa);
709 }
710
vpu_alloc_ext_mem(struct mtk_vpu * vpu,u32 fw_type)711 static int vpu_alloc_ext_mem(struct mtk_vpu *vpu, u32 fw_type)
712 {
713 struct device *dev = vpu->dev;
714 size_t fw_ext_size = fw_type ? VPU_EXT_D_SIZE : VPU_EXT_P_SIZE;
715 u32 vpu_ext_mem0 = fw_type ? VPU_DMEM_EXT0_ADDR : VPU_PMEM_EXT0_ADDR;
716 u32 vpu_ext_mem1 = fw_type ? VPU_DMEM_EXT1_ADDR : VPU_PMEM_EXT1_ADDR;
717 u32 offset_4gb = vpu->enable_4GB ? 0x40000000 : 0;
718
719 vpu->extmem[fw_type].va = dma_alloc_coherent(dev,
720 fw_ext_size,
721 &vpu->extmem[fw_type].pa,
722 GFP_KERNEL);
723 if (!vpu->extmem[fw_type].va) {
724 dev_err(dev, "Failed to allocate the extended program memory\n");
725 return -ENOMEM;
726 }
727
728 /* Disable extend0. Enable extend1 */
729 vpu_cfg_writel(vpu, 0x1, vpu_ext_mem0);
730 vpu_cfg_writel(vpu, (vpu->extmem[fw_type].pa & 0xFFFFF000) + offset_4gb,
731 vpu_ext_mem1);
732
733 dev_info(dev, "%s extend memory phy=0x%llx virt=0x%p\n",
734 fw_type ? "Data" : "Program",
735 (unsigned long long)vpu->extmem[fw_type].pa,
736 vpu->extmem[fw_type].va);
737
738 return 0;
739 }
740
vpu_ipi_handler(struct mtk_vpu * vpu)741 static void vpu_ipi_handler(struct mtk_vpu *vpu)
742 {
743 struct share_obj __iomem *rcv_obj = vpu->recv_buf;
744 struct vpu_ipi_desc *ipi_desc = vpu->ipi_desc;
745 unsigned char data[SHARE_BUF_SIZE];
746 s32 id = readl(&rcv_obj->id);
747
748 memcpy_fromio(data, rcv_obj->share_buf, sizeof(data));
749 if (id < IPI_MAX && ipi_desc[id].handler) {
750 ipi_desc[id].handler(data, readl(&rcv_obj->len),
751 ipi_desc[id].priv);
752 if (id > IPI_VPU_INIT) {
753 vpu->ipi_id_ack[id] = true;
754 wake_up(&vpu->ack_wq);
755 }
756 } else {
757 dev_err(vpu->dev, "No such ipi id = %d\n", id);
758 }
759 }
760
vpu_ipi_init(struct mtk_vpu * vpu)761 static int vpu_ipi_init(struct mtk_vpu *vpu)
762 {
763 /* Disable VPU to host interrupt */
764 vpu_cfg_writel(vpu, 0x0, VPU_TO_HOST);
765
766 /* shared buffer initialization */
767 vpu->recv_buf = vpu->reg.tcm + VPU_DTCM_OFFSET;
768 vpu->send_buf = vpu->recv_buf + 1;
769 memset_io(vpu->recv_buf, 0, sizeof(struct share_obj));
770 memset_io(vpu->send_buf, 0, sizeof(struct share_obj));
771
772 return 0;
773 }
774
vpu_irq_handler(int irq,void * priv)775 static irqreturn_t vpu_irq_handler(int irq, void *priv)
776 {
777 struct mtk_vpu *vpu = priv;
778 u32 vpu_to_host;
779 int ret;
780
781 /*
782 * Clock should have been enabled already.
783 * Enable again in case vpu_ipi_send times out
784 * and has disabled the clock.
785 */
786 ret = clk_enable(vpu->clk);
787 if (ret) {
788 dev_err(vpu->dev, "[VPU] enable clock failed %d\n", ret);
789 return IRQ_NONE;
790 }
791 vpu_to_host = vpu_cfg_readl(vpu, VPU_TO_HOST);
792 if (vpu_to_host & VPU_IPC_INT) {
793 vpu_ipi_handler(vpu);
794 } else {
795 dev_err(vpu->dev, "vpu watchdog timeout! 0x%x", vpu_to_host);
796 queue_work(vpu->wdt.wq, &vpu->wdt.ws);
797 }
798
799 /* VPU won't send another interrupt until we set VPU_TO_HOST to 0. */
800 vpu_cfg_writel(vpu, 0x0, VPU_TO_HOST);
801 clk_disable(vpu->clk);
802
803 return IRQ_HANDLED;
804 }
805
806 #ifdef CONFIG_DEBUG_FS
807 static struct dentry *vpu_debugfs;
808 #endif
mtk_vpu_probe(struct platform_device * pdev)809 static int mtk_vpu_probe(struct platform_device *pdev)
810 {
811 struct mtk_vpu *vpu;
812 struct device *dev;
813 int ret = 0;
814
815 dev_dbg(&pdev->dev, "initialization\n");
816
817 dev = &pdev->dev;
818 vpu = devm_kzalloc(dev, sizeof(*vpu), GFP_KERNEL);
819 if (!vpu)
820 return -ENOMEM;
821
822 vpu->dev = &pdev->dev;
823 vpu->reg.tcm = devm_platform_ioremap_resource_byname(pdev, "tcm");
824 if (IS_ERR((__force void *)vpu->reg.tcm))
825 return PTR_ERR((__force void *)vpu->reg.tcm);
826
827 vpu->reg.cfg = devm_platform_ioremap_resource_byname(pdev, "cfg_reg");
828 if (IS_ERR((__force void *)vpu->reg.cfg))
829 return PTR_ERR((__force void *)vpu->reg.cfg);
830
831 /* Get VPU clock */
832 vpu->clk = devm_clk_get(dev, "main");
833 if (IS_ERR(vpu->clk)) {
834 dev_err(dev, "get vpu clock failed\n");
835 return PTR_ERR(vpu->clk);
836 }
837
838 platform_set_drvdata(pdev, vpu);
839
840 ret = clk_prepare(vpu->clk);
841 if (ret) {
842 dev_err(dev, "prepare vpu clock failed\n");
843 return ret;
844 }
845
846 /* VPU watchdog */
847 vpu->wdt.wq = create_singlethread_workqueue("vpu_wdt");
848 if (!vpu->wdt.wq) {
849 dev_err(dev, "initialize wdt workqueue failed\n");
850 ret = -ENOMEM;
851 goto clk_unprepare;
852 }
853 INIT_WORK(&vpu->wdt.ws, vpu_wdt_reset_func);
854 mutex_init(&vpu->vpu_mutex);
855
856 ret = vpu_clock_enable(vpu);
857 if (ret) {
858 dev_err(dev, "enable vpu clock failed\n");
859 goto workqueue_destroy;
860 }
861
862 dev_dbg(dev, "vpu ipi init\n");
863 ret = vpu_ipi_init(vpu);
864 if (ret) {
865 dev_err(dev, "Failed to init ipi\n");
866 goto disable_vpu_clk;
867 }
868
869 /* register vpu initialization IPI */
870 ret = vpu_ipi_register(pdev, IPI_VPU_INIT, vpu_init_ipi_handler,
871 "vpu_init", vpu);
872 if (ret) {
873 dev_err(dev, "Failed to register IPI_VPU_INIT\n");
874 goto vpu_mutex_destroy;
875 }
876
877 #ifdef CONFIG_DEBUG_FS
878 vpu_debugfs = debugfs_create_file("mtk_vpu", S_IRUGO, NULL, (void *)dev,
879 &vpu_debug_fops);
880 #endif
881
882 /* Set PTCM to 96K and DTCM to 32K */
883 vpu_cfg_writel(vpu, 0x2, VPU_TCM_CFG);
884
885 vpu->enable_4GB = !!(totalram_pages() > (SZ_2G >> PAGE_SHIFT));
886 dev_info(dev, "4GB mode %u\n", vpu->enable_4GB);
887
888 if (vpu->enable_4GB) {
889 ret = of_reserved_mem_device_init(dev);
890 if (ret)
891 dev_info(dev, "init reserved memory failed\n");
892 /* continue to use dynamic allocation if failed */
893 }
894
895 ret = vpu_alloc_ext_mem(vpu, D_FW);
896 if (ret) {
897 dev_err(dev, "Allocate DM failed\n");
898 goto remove_debugfs;
899 }
900
901 ret = vpu_alloc_ext_mem(vpu, P_FW);
902 if (ret) {
903 dev_err(dev, "Allocate PM failed\n");
904 goto free_d_mem;
905 }
906
907 init_waitqueue_head(&vpu->run.wq);
908 init_waitqueue_head(&vpu->ack_wq);
909
910 ret = platform_get_irq(pdev, 0);
911 if (ret < 0)
912 goto free_p_mem;
913 vpu->reg.irq = ret;
914 ret = devm_request_irq(dev, vpu->reg.irq, vpu_irq_handler, 0,
915 pdev->name, vpu);
916 if (ret) {
917 dev_err(dev, "failed to request irq\n");
918 goto free_p_mem;
919 }
920
921 vpu_clock_disable(vpu);
922 dev_dbg(dev, "initialization completed\n");
923
924 return 0;
925
926 free_p_mem:
927 vpu_free_ext_mem(vpu, P_FW);
928 free_d_mem:
929 vpu_free_ext_mem(vpu, D_FW);
930 remove_debugfs:
931 of_reserved_mem_device_release(dev);
932 #ifdef CONFIG_DEBUG_FS
933 debugfs_remove(vpu_debugfs);
934 #endif
935 memset(vpu->ipi_desc, 0, sizeof(struct vpu_ipi_desc) * IPI_MAX);
936 vpu_mutex_destroy:
937 mutex_destroy(&vpu->vpu_mutex);
938 disable_vpu_clk:
939 vpu_clock_disable(vpu);
940 workqueue_destroy:
941 destroy_workqueue(vpu->wdt.wq);
942 clk_unprepare:
943 clk_unprepare(vpu->clk);
944
945 return ret;
946 }
947
948 static const struct of_device_id mtk_vpu_match[] = {
949 {
950 .compatible = "mediatek,mt8173-vpu",
951 },
952 {},
953 };
954 MODULE_DEVICE_TABLE(of, mtk_vpu_match);
955
mtk_vpu_remove(struct platform_device * pdev)956 static int mtk_vpu_remove(struct platform_device *pdev)
957 {
958 struct mtk_vpu *vpu = platform_get_drvdata(pdev);
959
960 #ifdef CONFIG_DEBUG_FS
961 debugfs_remove(vpu_debugfs);
962 #endif
963 if (vpu->wdt.wq)
964 destroy_workqueue(vpu->wdt.wq);
965 vpu_free_ext_mem(vpu, P_FW);
966 vpu_free_ext_mem(vpu, D_FW);
967 mutex_destroy(&vpu->vpu_mutex);
968 clk_unprepare(vpu->clk);
969
970 return 0;
971 }
972
mtk_vpu_suspend(struct device * dev)973 static int mtk_vpu_suspend(struct device *dev)
974 {
975 struct mtk_vpu *vpu = dev_get_drvdata(dev);
976 unsigned long timeout;
977 int ret;
978
979 ret = vpu_clock_enable(vpu);
980 if (ret) {
981 dev_err(dev, "failed to enable vpu clock\n");
982 return ret;
983 }
984
985 if (!vpu_running(vpu)) {
986 vpu_clock_disable(vpu);
987 clk_unprepare(vpu->clk);
988 return 0;
989 }
990
991 mutex_lock(&vpu->vpu_mutex);
992 /* disable vpu timer interrupt */
993 vpu_cfg_writel(vpu, vpu_cfg_readl(vpu, VPU_INT_STATUS) | VPU_IDLE_STATE,
994 VPU_INT_STATUS);
995 /* check if vpu is idle for system suspend */
996 timeout = jiffies + msecs_to_jiffies(VPU_IDLE_TIMEOUT_MS);
997 do {
998 if (time_after(jiffies, timeout)) {
999 dev_err(dev, "vpu idle timeout\n");
1000 mutex_unlock(&vpu->vpu_mutex);
1001 vpu_clock_disable(vpu);
1002 return -EIO;
1003 }
1004 } while (!vpu_cfg_readl(vpu, VPU_IDLE_REG));
1005
1006 mutex_unlock(&vpu->vpu_mutex);
1007 vpu_clock_disable(vpu);
1008 clk_unprepare(vpu->clk);
1009
1010 return 0;
1011 }
1012
mtk_vpu_resume(struct device * dev)1013 static int mtk_vpu_resume(struct device *dev)
1014 {
1015 struct mtk_vpu *vpu = dev_get_drvdata(dev);
1016 int ret;
1017
1018 clk_prepare(vpu->clk);
1019 ret = vpu_clock_enable(vpu);
1020 if (ret) {
1021 dev_err(dev, "failed to enable vpu clock\n");
1022 return ret;
1023 }
1024
1025 mutex_lock(&vpu->vpu_mutex);
1026 /* enable vpu timer interrupt */
1027 vpu_cfg_writel(vpu,
1028 vpu_cfg_readl(vpu, VPU_INT_STATUS) & ~(VPU_IDLE_STATE),
1029 VPU_INT_STATUS);
1030 mutex_unlock(&vpu->vpu_mutex);
1031 vpu_clock_disable(vpu);
1032
1033 return 0;
1034 }
1035
1036 static const struct dev_pm_ops mtk_vpu_pm = {
1037 .suspend = mtk_vpu_suspend,
1038 .resume = mtk_vpu_resume,
1039 };
1040
1041 static struct platform_driver mtk_vpu_driver = {
1042 .probe = mtk_vpu_probe,
1043 .remove = mtk_vpu_remove,
1044 .driver = {
1045 .name = "mtk_vpu",
1046 .pm = &mtk_vpu_pm,
1047 .of_match_table = mtk_vpu_match,
1048 },
1049 };
1050
1051 module_platform_driver(mtk_vpu_driver);
1052
1053 MODULE_LICENSE("GPL v2");
1054 MODULE_DESCRIPTION("Mediatek Video Processor Unit driver");
1055