1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Copyright (c) 2016 MediaTek Inc.
4  * Author: Daniel Hsiao <daniel.hsiao@mediatek.com>
5  *	Kai-Sean Yang <kai-sean.yang@mediatek.com>
6  *	Tiffany Lin <tiffany.lin@mediatek.com>
7  */
8 
9 #include <linux/fs.h>
10 #include <linux/slab.h>
11 #include <linux/syscalls.h>
12 #include <linux/delay.h>
13 #include <linux/time.h>
14 
15 #include "../mtk_vcodec_intr.h"
16 #include "../vdec_drv_base.h"
17 #include "../vdec_vpu_if.h"
18 
19 #define VP9_SUPER_FRAME_BS_SZ 64
20 #define MAX_VP9_DPB_SIZE	9
21 
22 #define REFS_PER_FRAME 3
23 #define MAX_NUM_REF_FRAMES 8
24 #define VP9_MAX_FRM_BUF_NUM 9
25 #define VP9_MAX_FRM_BUF_NODE_NUM (VP9_MAX_FRM_BUF_NUM * 2)
26 #define VP9_SEG_ID_SZ 0x12000
27 
28 /**
29  * struct vp9_dram_buf - contains buffer info for vpu
30  * @va : cpu address
31  * @pa : iova address
32  * @sz : buffer size
33  * @padding : for 64 bytes alignment
34  */
35 struct vp9_dram_buf {
36 	unsigned long va;
37 	unsigned long pa;
38 	unsigned int sz;
39 	unsigned int padding;
40 };
41 
42 /**
43  * struct vp9_fb_info - contains frame buffer info
44  * @fb : frmae buffer
45  * @reserved : reserved field used by vpu
46  */
47 struct vp9_fb_info {
48 	struct vdec_fb *fb;
49 	unsigned int reserved[32];
50 };
51 
52 /**
53  * struct vp9_ref_cnt_buf - contains reference buffer information
54  * @buf : referenced frame buffer
55  * @ref_cnt : referenced frame buffer's reference count.
56  *	When reference count=0, remove it from reference list
57  */
58 struct vp9_ref_cnt_buf {
59 	struct vp9_fb_info buf;
60 	unsigned int ref_cnt;
61 };
62 
63 /**
64  * struct vp9_ref_buf - contains current frame's reference buffer information
65  * @buf : reference buffer
66  * @idx : reference buffer index to frm_bufs
67  * @reserved : reserved field used by vpu
68  */
69 struct vp9_ref_buf {
70 	struct vp9_fb_info *buf;
71 	unsigned int idx;
72 	unsigned int reserved[6];
73 };
74 
75 /**
76  * struct vp9_sf_ref_fb - contains frame buffer info
77  * @fb : super frame reference frame buffer
78  * @used : this reference frame info entry is used
79  * @padding : for 64 bytes size align
80  */
81 struct vp9_sf_ref_fb {
82 	struct vdec_fb fb;
83 	int used;
84 	int padding;
85 };
86 
87 /*
88  * struct vdec_vp9_vsi - shared buffer between host and VPU firmware
89  *	AP-W/R : AP is writer/reader on this item
90  *	VPU-W/R: VPU is write/reader on this item
91  * @sf_bs_buf : super frame backup buffer (AP-W, VPU-R)
92  * @sf_ref_fb : record supoer frame reference buffer information
93  *	(AP-R/W, VPU-R/W)
94  * @sf_next_ref_fb_idx : next available super frame (AP-W, VPU-R)
95  * @sf_frm_cnt : super frame count, filled by vpu (AP-R, VPU-W)
96  * @sf_frm_offset : super frame offset, filled by vpu (AP-R, VPU-W)
97  * @sf_frm_sz : super frame size, filled by vpu (AP-R, VPU-W)
98  * @sf_frm_idx : current super frame (AP-R, VPU-W)
99  * @sf_init : inform super frame info already parsed by vpu (AP-R, VPU-W)
100  * @fb : capture buffer (AP-W, VPU-R)
101  * @bs : bs buffer (AP-W, VPU-R)
102  * @cur_fb : current show capture buffer (AP-R/W, VPU-R/W)
103  * @pic_w : picture width (AP-R, VPU-W)
104  * @pic_h : picture height (AP-R, VPU-W)
105  * @buf_w : codec width (AP-R, VPU-W)
106  * @buf_h : coded height (AP-R, VPU-W)
107  * @buf_sz_y_bs : ufo compressed y plane size (AP-R, VPU-W)
108  * @buf_sz_c_bs : ufo compressed cbcr plane size (AP-R, VPU-W)
109  * @buf_len_sz_y : size used to store y plane ufo info (AP-R, VPU-W)
110  * @buf_len_sz_c : size used to store cbcr plane ufo info (AP-R, VPU-W)
111 
112  * @profile : profile sparsed from vpu (AP-R, VPU-W)
113  * @show_frame : [BIT(0)] display this frame or not (AP-R, VPU-W)
114  *	[BIT(1)] reset segment data or not (AP-R, VPU-W)
115  *	[BIT(2)] trig decoder hardware or not (AP-R, VPU-W)
116  *	[BIT(3)] ask VPU to set bits(0~4) accordingly (AP-W, VPU-R)
117  *	[BIT(4)] do not reset segment data before every frame (AP-R, VPU-W)
118  * @show_existing_frame : inform this frame is show existing frame
119  *	(AP-R, VPU-W)
120  * @frm_to_show_idx : index to show frame (AP-R, VPU-W)
121 
122  * @refresh_frm_flags : indicate when frame need to refine reference count
123  *	(AP-R, VPU-W)
124  * @resolution_changed : resolution change in this frame (AP-R, VPU-W)
125 
126  * @frm_bufs : maintain reference buffer info (AP-R/W, VPU-R/W)
127  * @ref_frm_map : maintain reference buffer map info (AP-R/W, VPU-R/W)
128  * @new_fb_idx : index to frm_bufs array (AP-R, VPU-W)
129  * @frm_num : decoded frame number, include sub-frame count (AP-R, VPU-W)
130  * @mv_buf : motion vector working buffer (AP-W, VPU-R)
131  * @frm_refs : maintain three reference buffer info (AP-R/W, VPU-R/W)
132  * @seg_id_buf : segmentation map working buffer (AP-W, VPU-R)
133  */
134 struct vdec_vp9_vsi {
135 	unsigned char sf_bs_buf[VP9_SUPER_FRAME_BS_SZ];
136 	struct vp9_sf_ref_fb sf_ref_fb[VP9_MAX_FRM_BUF_NUM-1];
137 	int sf_next_ref_fb_idx;
138 	unsigned int sf_frm_cnt;
139 	unsigned int sf_frm_offset[VP9_MAX_FRM_BUF_NUM-1];
140 	unsigned int sf_frm_sz[VP9_MAX_FRM_BUF_NUM-1];
141 	unsigned int sf_frm_idx;
142 	unsigned int sf_init;
143 	struct vdec_fb fb;
144 	struct mtk_vcodec_mem bs;
145 	struct vdec_fb cur_fb;
146 	unsigned int pic_w;
147 	unsigned int pic_h;
148 	unsigned int buf_w;
149 	unsigned int buf_h;
150 	unsigned int buf_sz_y_bs;
151 	unsigned int buf_sz_c_bs;
152 	unsigned int buf_len_sz_y;
153 	unsigned int buf_len_sz_c;
154 	unsigned int profile;
155 	unsigned int show_frame;
156 	unsigned int show_existing_frame;
157 	unsigned int frm_to_show_idx;
158 	unsigned int refresh_frm_flags;
159 	unsigned int resolution_changed;
160 
161 	struct vp9_ref_cnt_buf frm_bufs[VP9_MAX_FRM_BUF_NUM];
162 	int ref_frm_map[MAX_NUM_REF_FRAMES];
163 	unsigned int new_fb_idx;
164 	unsigned int frm_num;
165 	struct vp9_dram_buf mv_buf;
166 
167 	struct vp9_ref_buf frm_refs[REFS_PER_FRAME];
168 	struct vp9_dram_buf seg_id_buf;
169 
170 };
171 
172 /*
173  * struct vdec_vp9_inst - vp9 decode instance
174  * @mv_buf : working buffer for mv
175  * @seg_id_buf : working buffer for segmentation map
176  * @dec_fb : vdec_fb node to link fb to different fb_xxx_list
177  * @available_fb_node_list : current available vdec_fb node
178  * @fb_use_list : current used or referenced vdec_fb
179  * @fb_free_list : current available to free vdec_fb
180  * @fb_disp_list : current available to display vdec_fb
181  * @cur_fb : current frame buffer
182  * @ctx : current decode context
183  * @vpu : vpu instance information
184  * @vsi : shared buffer between host and VPU firmware
185  * @total_frm_cnt : total frame count, it do not include sub-frames in super
186  *	    frame
187  * @mem : instance memory information
188  */
189 struct vdec_vp9_inst {
190 	struct mtk_vcodec_mem mv_buf;
191 	struct mtk_vcodec_mem seg_id_buf;
192 
193 	struct vdec_fb_node dec_fb[VP9_MAX_FRM_BUF_NODE_NUM];
194 	struct list_head available_fb_node_list;
195 	struct list_head fb_use_list;
196 	struct list_head fb_free_list;
197 	struct list_head fb_disp_list;
198 	struct vdec_fb *cur_fb;
199 	struct mtk_vcodec_ctx *ctx;
200 	struct vdec_vpu_inst vpu;
201 	struct vdec_vp9_vsi *vsi;
202 	unsigned int total_frm_cnt;
203 	struct mtk_vcodec_mem mem;
204 };
205 
vp9_is_sf_ref_fb(struct vdec_vp9_inst * inst,struct vdec_fb * fb)206 static bool vp9_is_sf_ref_fb(struct vdec_vp9_inst *inst, struct vdec_fb *fb)
207 {
208 	int i;
209 	struct vdec_vp9_vsi *vsi = inst->vsi;
210 
211 	for (i = 0; i < ARRAY_SIZE(vsi->sf_ref_fb); i++) {
212 		if (fb == &vsi->sf_ref_fb[i].fb)
213 			return true;
214 	}
215 	return false;
216 }
217 
vp9_rm_from_fb_use_list(struct vdec_vp9_inst * inst,void * addr)218 static struct vdec_fb *vp9_rm_from_fb_use_list(struct vdec_vp9_inst
219 					*inst, void *addr)
220 {
221 	struct vdec_fb *fb = NULL;
222 	struct vdec_fb_node *node;
223 
224 	list_for_each_entry(node, &inst->fb_use_list, list) {
225 		fb = (struct vdec_fb *)node->fb;
226 		if (fb->base_y.va == addr) {
227 			list_move_tail(&node->list,
228 				       &inst->available_fb_node_list);
229 			break;
230 		}
231 	}
232 	return fb;
233 }
234 
vp9_add_to_fb_free_list(struct vdec_vp9_inst * inst,struct vdec_fb * fb)235 static void vp9_add_to_fb_free_list(struct vdec_vp9_inst *inst,
236 			     struct vdec_fb *fb)
237 {
238 	struct vdec_fb_node *node;
239 
240 	if (fb) {
241 		node = list_first_entry_or_null(&inst->available_fb_node_list,
242 					struct vdec_fb_node, list);
243 
244 		if (node) {
245 			node->fb = fb;
246 			list_move_tail(&node->list, &inst->fb_free_list);
247 		}
248 	} else {
249 		mtk_vcodec_debug(inst, "No free fb node");
250 	}
251 }
252 
vp9_free_sf_ref_fb(struct vdec_fb * fb)253 static void vp9_free_sf_ref_fb(struct vdec_fb *fb)
254 {
255 	struct vp9_sf_ref_fb *sf_ref_fb =
256 		container_of(fb, struct vp9_sf_ref_fb, fb);
257 
258 	sf_ref_fb->used = 0;
259 }
260 
vp9_ref_cnt_fb(struct vdec_vp9_inst * inst,int * idx,int new_idx)261 static void vp9_ref_cnt_fb(struct vdec_vp9_inst *inst, int *idx,
262 			   int new_idx)
263 {
264 	struct vdec_vp9_vsi *vsi = inst->vsi;
265 	int ref_idx = *idx;
266 
267 	if (ref_idx >= 0 && vsi->frm_bufs[ref_idx].ref_cnt > 0) {
268 		vsi->frm_bufs[ref_idx].ref_cnt--;
269 
270 		if (vsi->frm_bufs[ref_idx].ref_cnt == 0) {
271 			if (!vp9_is_sf_ref_fb(inst,
272 					      vsi->frm_bufs[ref_idx].buf.fb)) {
273 				struct vdec_fb *fb;
274 
275 				fb = vp9_rm_from_fb_use_list(inst,
276 				     vsi->frm_bufs[ref_idx].buf.fb->base_y.va);
277 				vp9_add_to_fb_free_list(inst, fb);
278 			} else
279 				vp9_free_sf_ref_fb(
280 					vsi->frm_bufs[ref_idx].buf.fb);
281 		}
282 	}
283 
284 	*idx = new_idx;
285 	vsi->frm_bufs[new_idx].ref_cnt++;
286 }
287 
vp9_free_all_sf_ref_fb(struct vdec_vp9_inst * inst)288 static void vp9_free_all_sf_ref_fb(struct vdec_vp9_inst *inst)
289 {
290 	int i;
291 	struct vdec_vp9_vsi *vsi = inst->vsi;
292 
293 	for (i = 0; i < ARRAY_SIZE(vsi->sf_ref_fb); i++) {
294 		if (vsi->sf_ref_fb[i].fb.base_y.va) {
295 			mtk_vcodec_mem_free(inst->ctx,
296 				&vsi->sf_ref_fb[i].fb.base_y);
297 			mtk_vcodec_mem_free(inst->ctx,
298 				&vsi->sf_ref_fb[i].fb.base_c);
299 			vsi->sf_ref_fb[i].used = 0;
300 		}
301 	}
302 }
303 
304 /* For each sub-frame except the last one, the driver will dynamically
305  * allocate reference buffer by calling vp9_get_sf_ref_fb()
306  * The last sub-frame will use the original fb provided by the
307  * vp9_dec_decode() interface
308  */
vp9_get_sf_ref_fb(struct vdec_vp9_inst * inst)309 static int vp9_get_sf_ref_fb(struct vdec_vp9_inst *inst)
310 {
311 	int idx;
312 	struct mtk_vcodec_mem *mem_basy_y;
313 	struct mtk_vcodec_mem *mem_basy_c;
314 	struct vdec_vp9_vsi *vsi = inst->vsi;
315 
316 	for (idx = 0;
317 		idx < ARRAY_SIZE(vsi->sf_ref_fb);
318 		idx++) {
319 		if (vsi->sf_ref_fb[idx].fb.base_y.va &&
320 		    vsi->sf_ref_fb[idx].used == 0) {
321 			return idx;
322 		}
323 	}
324 
325 	for (idx = 0;
326 		idx < ARRAY_SIZE(vsi->sf_ref_fb);
327 		idx++) {
328 		if (vsi->sf_ref_fb[idx].fb.base_y.va == NULL)
329 			break;
330 	}
331 
332 	if (idx == ARRAY_SIZE(vsi->sf_ref_fb)) {
333 		mtk_vcodec_err(inst, "List Full");
334 		return -1;
335 	}
336 
337 	mem_basy_y = &vsi->sf_ref_fb[idx].fb.base_y;
338 	mem_basy_y->size = vsi->buf_sz_y_bs +
339 		vsi->buf_len_sz_y;
340 
341 	if (mtk_vcodec_mem_alloc(inst->ctx, mem_basy_y)) {
342 		mtk_vcodec_err(inst, "Cannot allocate sf_ref_buf y_buf");
343 		return -1;
344 	}
345 
346 	mem_basy_c = &vsi->sf_ref_fb[idx].fb.base_c;
347 	mem_basy_c->size = vsi->buf_sz_c_bs +
348 		vsi->buf_len_sz_c;
349 
350 	if (mtk_vcodec_mem_alloc(inst->ctx, mem_basy_c)) {
351 		mtk_vcodec_err(inst, "Cannot allocate sf_ref_fb c_buf");
352 		return -1;
353 	}
354 	vsi->sf_ref_fb[idx].used = 0;
355 
356 	return idx;
357 }
358 
vp9_alloc_work_buf(struct vdec_vp9_inst * inst)359 static bool vp9_alloc_work_buf(struct vdec_vp9_inst *inst)
360 {
361 	struct vdec_vp9_vsi *vsi = inst->vsi;
362 	int result;
363 	struct mtk_vcodec_mem *mem;
364 
365 	unsigned int max_pic_w;
366 	unsigned int max_pic_h;
367 
368 
369 	if (!(inst->ctx->dev->dec_capability &
370 		VCODEC_CAPABILITY_4K_DISABLED)) {
371 		max_pic_w = VCODEC_DEC_4K_CODED_WIDTH;
372 		max_pic_h = VCODEC_DEC_4K_CODED_HEIGHT;
373 	} else {
374 		max_pic_w = MTK_VDEC_MAX_W;
375 		max_pic_h = MTK_VDEC_MAX_H;
376 	}
377 
378 	if ((vsi->pic_w > max_pic_w) ||
379 		(vsi->pic_h > max_pic_h)) {
380 		mtk_vcodec_err(inst, "Invalid w/h %d/%d",
381 				vsi->pic_w, vsi->pic_h);
382 		return false;
383 	}
384 
385 	mtk_vcodec_debug(inst, "BUF CHG(%d): w/h/sb_w/sb_h=%d/%d/%d/%d",
386 			vsi->resolution_changed,
387 			vsi->pic_w,
388 			vsi->pic_h,
389 			vsi->buf_w,
390 			vsi->buf_h);
391 
392 	mem = &inst->mv_buf;
393 	if (mem->va)
394 		mtk_vcodec_mem_free(inst->ctx, mem);
395 
396 	mem->size = ((vsi->buf_w / 64) *
397 		    (vsi->buf_h / 64) + 2) * 36 * 16;
398 	result = mtk_vcodec_mem_alloc(inst->ctx, mem);
399 	if (result) {
400 		mem->size = 0;
401 		mtk_vcodec_err(inst, "Cannot allocate mv_buf");
402 		return false;
403 	}
404 	/* Set the va again */
405 	vsi->mv_buf.va = (unsigned long)mem->va;
406 	vsi->mv_buf.pa = (unsigned long)mem->dma_addr;
407 	vsi->mv_buf.sz = (unsigned int)mem->size;
408 
409 
410 	mem = &inst->seg_id_buf;
411 	if (mem->va)
412 		mtk_vcodec_mem_free(inst->ctx, mem);
413 
414 	mem->size = VP9_SEG_ID_SZ;
415 	result = mtk_vcodec_mem_alloc(inst->ctx, mem);
416 	if (result) {
417 		mem->size = 0;
418 		mtk_vcodec_err(inst, "Cannot allocate seg_id_buf");
419 		return false;
420 	}
421 	/* Set the va again */
422 	vsi->seg_id_buf.va = (unsigned long)mem->va;
423 	vsi->seg_id_buf.pa = (unsigned long)mem->dma_addr;
424 	vsi->seg_id_buf.sz = (unsigned int)mem->size;
425 
426 
427 	vp9_free_all_sf_ref_fb(inst);
428 	vsi->sf_next_ref_fb_idx = vp9_get_sf_ref_fb(inst);
429 
430 	return true;
431 }
432 
vp9_add_to_fb_disp_list(struct vdec_vp9_inst * inst,struct vdec_fb * fb)433 static bool vp9_add_to_fb_disp_list(struct vdec_vp9_inst *inst,
434 			     struct vdec_fb *fb)
435 {
436 	struct vdec_fb_node *node;
437 
438 	if (!fb) {
439 		mtk_vcodec_err(inst, "fb == NULL");
440 		return false;
441 	}
442 
443 	node = list_first_entry_or_null(&inst->available_fb_node_list,
444 					struct vdec_fb_node, list);
445 	if (node) {
446 		node->fb = fb;
447 		list_move_tail(&node->list, &inst->fb_disp_list);
448 	} else {
449 		mtk_vcodec_err(inst, "No available fb node");
450 		return false;
451 	}
452 
453 	return true;
454 }
455 
456 /* If any buffer updating is signaled it should be done here. */
vp9_swap_frm_bufs(struct vdec_vp9_inst * inst)457 static void vp9_swap_frm_bufs(struct vdec_vp9_inst *inst)
458 {
459 	struct vdec_vp9_vsi *vsi = inst->vsi;
460 	struct vp9_fb_info *frm_to_show;
461 	int ref_index = 0, mask;
462 
463 	for (mask = vsi->refresh_frm_flags; mask; mask >>= 1) {
464 		if (mask & 1)
465 			vp9_ref_cnt_fb(inst, &vsi->ref_frm_map[ref_index],
466 				       vsi->new_fb_idx);
467 		++ref_index;
468 	}
469 
470 	frm_to_show = &vsi->frm_bufs[vsi->new_fb_idx].buf;
471 	vsi->frm_bufs[vsi->new_fb_idx].ref_cnt--;
472 
473 	if (frm_to_show->fb != inst->cur_fb) {
474 		/* This frame is show exist frame and no decode output
475 		 * copy frame data from frm_to_show to current CAPTURE
476 		 * buffer
477 		 */
478 		if ((frm_to_show->fb != NULL) &&
479 			(inst->cur_fb->base_y.size >=
480 			frm_to_show->fb->base_y.size) &&
481 			(inst->cur_fb->base_c.size >=
482 			frm_to_show->fb->base_c.size)) {
483 			memcpy((void *)inst->cur_fb->base_y.va,
484 				(void *)frm_to_show->fb->base_y.va,
485 				frm_to_show->fb->base_y.size);
486 			memcpy((void *)inst->cur_fb->base_c.va,
487 				(void *)frm_to_show->fb->base_c.va,
488 				frm_to_show->fb->base_c.size);
489 		} else {
490 			/* After resolution change case, current CAPTURE buffer
491 			 * may have less buffer size than frm_to_show buffer
492 			 * size
493 			 */
494 			if (frm_to_show->fb != NULL)
495 				mtk_vcodec_err(inst,
496 					"inst->cur_fb->base_y.size=%zu, frm_to_show->fb.base_y.size=%zu",
497 					inst->cur_fb->base_y.size,
498 					frm_to_show->fb->base_y.size);
499 		}
500 		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb)) {
501 			if (vsi->show_frame & BIT(0))
502 				vp9_add_to_fb_disp_list(inst, inst->cur_fb);
503 		}
504 	} else {
505 		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb)) {
506 			if (vsi->show_frame & BIT(0))
507 				vp9_add_to_fb_disp_list(inst, frm_to_show->fb);
508 		}
509 	}
510 
511 	/* when ref_cnt ==0, move this fb to fb_free_list. v4l2 driver will
512 	 * clean fb_free_list
513 	 */
514 	if (vsi->frm_bufs[vsi->new_fb_idx].ref_cnt == 0) {
515 		if (!vp9_is_sf_ref_fb(
516 			inst, vsi->frm_bufs[vsi->new_fb_idx].buf.fb)) {
517 			struct vdec_fb *fb;
518 
519 			fb = vp9_rm_from_fb_use_list(inst,
520 			vsi->frm_bufs[vsi->new_fb_idx].buf.fb->base_y.va);
521 
522 			vp9_add_to_fb_free_list(inst, fb);
523 		} else {
524 			vp9_free_sf_ref_fb(
525 				vsi->frm_bufs[vsi->new_fb_idx].buf.fb);
526 		}
527 	}
528 
529 	/* if this super frame and it is not last sub-frame, get next fb for
530 	 * sub-frame decode
531 	 */
532 	if (vsi->sf_frm_cnt > 0 && vsi->sf_frm_idx != vsi->sf_frm_cnt - 1)
533 		vsi->sf_next_ref_fb_idx = vp9_get_sf_ref_fb(inst);
534 }
535 
vp9_wait_dec_end(struct vdec_vp9_inst * inst)536 static bool vp9_wait_dec_end(struct vdec_vp9_inst *inst)
537 {
538 	struct mtk_vcodec_ctx *ctx = inst->ctx;
539 
540 	mtk_vcodec_wait_for_done_ctx(inst->ctx,
541 			MTK_INST_IRQ_RECEIVED,
542 			WAIT_INTR_TIMEOUT_MS, 0);
543 
544 	if (ctx->irq_status & MTK_VDEC_IRQ_STATUS_DEC_SUCCESS)
545 		return true;
546 	else
547 		return false;
548 }
549 
vp9_alloc_inst(struct mtk_vcodec_ctx * ctx)550 static struct vdec_vp9_inst *vp9_alloc_inst(struct mtk_vcodec_ctx *ctx)
551 {
552 	int result;
553 	struct mtk_vcodec_mem mem;
554 	struct vdec_vp9_inst *inst;
555 
556 	memset(&mem, 0, sizeof(mem));
557 	mem.size = sizeof(struct vdec_vp9_inst);
558 	result = mtk_vcodec_mem_alloc(ctx, &mem);
559 	if (result)
560 		return NULL;
561 
562 	inst = mem.va;
563 	inst->mem = mem;
564 
565 	return inst;
566 }
567 
vp9_free_inst(struct vdec_vp9_inst * inst)568 static void vp9_free_inst(struct vdec_vp9_inst *inst)
569 {
570 	struct mtk_vcodec_mem mem;
571 
572 	mem = inst->mem;
573 	if (mem.va)
574 		mtk_vcodec_mem_free(inst->ctx, &mem);
575 }
576 
vp9_decode_end_proc(struct vdec_vp9_inst * inst)577 static bool vp9_decode_end_proc(struct vdec_vp9_inst *inst)
578 {
579 	struct vdec_vp9_vsi *vsi = inst->vsi;
580 	bool ret = false;
581 
582 	if (!vsi->show_existing_frame) {
583 		ret = vp9_wait_dec_end(inst);
584 		if (!ret) {
585 			mtk_vcodec_err(inst, "Decode failed, Decode Timeout @[%d]",
586 				vsi->frm_num);
587 			return false;
588 		}
589 
590 		if (vpu_dec_end(&inst->vpu)) {
591 			mtk_vcodec_err(inst, "vp9_dec_vpu_end failed");
592 			return false;
593 		}
594 		mtk_vcodec_debug(inst, "Decode Ok @%d (%d/%d)", vsi->frm_num,
595 				vsi->pic_w, vsi->pic_h);
596 	} else {
597 		mtk_vcodec_debug(inst, "Decode Ok @%d (show_existing_frame)",
598 				vsi->frm_num);
599 	}
600 
601 	vp9_swap_frm_bufs(inst);
602 	vsi->frm_num++;
603 	return true;
604 }
605 
vp9_is_last_sub_frm(struct vdec_vp9_inst * inst)606 static bool vp9_is_last_sub_frm(struct vdec_vp9_inst *inst)
607 {
608 	struct vdec_vp9_vsi *vsi = inst->vsi;
609 
610 	if (vsi->sf_frm_cnt <= 0 || vsi->sf_frm_idx == vsi->sf_frm_cnt)
611 		return true;
612 
613 	return false;
614 }
615 
vp9_rm_from_fb_disp_list(struct vdec_vp9_inst * inst)616 static struct vdec_fb *vp9_rm_from_fb_disp_list(struct vdec_vp9_inst *inst)
617 {
618 	struct vdec_fb_node *node;
619 	struct vdec_fb *fb = NULL;
620 
621 	node = list_first_entry_or_null(&inst->fb_disp_list,
622 					struct vdec_fb_node, list);
623 	if (node) {
624 		fb = (struct vdec_fb *)node->fb;
625 		fb->status |= FB_ST_DISPLAY;
626 		list_move_tail(&node->list, &inst->available_fb_node_list);
627 		mtk_vcodec_debug(inst, "[FB] get disp fb %p st=%d",
628 				 node->fb, fb->status);
629 	} else
630 		mtk_vcodec_debug(inst, "[FB] there is no disp fb");
631 
632 	return fb;
633 }
634 
vp9_add_to_fb_use_list(struct vdec_vp9_inst * inst,struct vdec_fb * fb)635 static bool vp9_add_to_fb_use_list(struct vdec_vp9_inst *inst,
636 			    struct vdec_fb *fb)
637 {
638 	struct vdec_fb_node *node;
639 
640 	if (!fb) {
641 		mtk_vcodec_debug(inst, "fb == NULL");
642 		return false;
643 	}
644 
645 	node = list_first_entry_or_null(&inst->available_fb_node_list,
646 					struct vdec_fb_node, list);
647 	if (node) {
648 		node->fb = fb;
649 		list_move_tail(&node->list, &inst->fb_use_list);
650 	} else {
651 		mtk_vcodec_err(inst, "No free fb node");
652 		return false;
653 	}
654 	return true;
655 }
656 
vp9_reset(struct vdec_vp9_inst * inst)657 static void vp9_reset(struct vdec_vp9_inst *inst)
658 {
659 	struct vdec_fb_node *node, *tmp;
660 
661 	list_for_each_entry_safe(node, tmp, &inst->fb_use_list, list)
662 		list_move_tail(&node->list, &inst->fb_free_list);
663 
664 	vp9_free_all_sf_ref_fb(inst);
665 	inst->vsi->sf_next_ref_fb_idx = vp9_get_sf_ref_fb(inst);
666 
667 	if (vpu_dec_reset(&inst->vpu))
668 		mtk_vcodec_err(inst, "vp9_dec_vpu_reset failed");
669 
670 	/* Set the va again, since vpu_dec_reset will clear mv_buf in vpu */
671 	inst->vsi->mv_buf.va = (unsigned long)inst->mv_buf.va;
672 	inst->vsi->mv_buf.pa = (unsigned long)inst->mv_buf.dma_addr;
673 	inst->vsi->mv_buf.sz = (unsigned long)inst->mv_buf.size;
674 
675 	/* Set the va again, since vpu_dec_reset will clear seg_id_buf in vpu */
676 	inst->vsi->seg_id_buf.va = (unsigned long)inst->seg_id_buf.va;
677 	inst->vsi->seg_id_buf.pa = (unsigned long)inst->seg_id_buf.dma_addr;
678 	inst->vsi->seg_id_buf.sz = (unsigned long)inst->seg_id_buf.size;
679 
680 }
681 
init_all_fb_lists(struct vdec_vp9_inst * inst)682 static void init_all_fb_lists(struct vdec_vp9_inst *inst)
683 {
684 	int i;
685 
686 	INIT_LIST_HEAD(&inst->available_fb_node_list);
687 	INIT_LIST_HEAD(&inst->fb_use_list);
688 	INIT_LIST_HEAD(&inst->fb_free_list);
689 	INIT_LIST_HEAD(&inst->fb_disp_list);
690 
691 	for (i = 0; i < ARRAY_SIZE(inst->dec_fb); i++) {
692 		INIT_LIST_HEAD(&inst->dec_fb[i].list);
693 		inst->dec_fb[i].fb = NULL;
694 		list_add_tail(&inst->dec_fb[i].list,
695 			      &inst->available_fb_node_list);
696 	}
697 }
698 
get_pic_info(struct vdec_vp9_inst * inst,struct vdec_pic_info * pic)699 static void get_pic_info(struct vdec_vp9_inst *inst, struct vdec_pic_info *pic)
700 {
701 	pic->fb_sz[0] = inst->vsi->buf_sz_y_bs + inst->vsi->buf_len_sz_y;
702 	pic->fb_sz[1] = inst->vsi->buf_sz_c_bs + inst->vsi->buf_len_sz_c;
703 
704 	pic->pic_w = inst->vsi->pic_w;
705 	pic->pic_h = inst->vsi->pic_h;
706 	pic->buf_w = inst->vsi->buf_w;
707 	pic->buf_h = inst->vsi->buf_h;
708 
709 	mtk_vcodec_debug(inst, "pic(%d, %d), buf(%d, %d)",
710 		 pic->pic_w, pic->pic_h, pic->buf_w, pic->buf_h);
711 	mtk_vcodec_debug(inst, "fb size: Y(%d), C(%d)",
712 		pic->fb_sz[0],
713 		pic->fb_sz[1]);
714 }
715 
get_disp_fb(struct vdec_vp9_inst * inst,struct vdec_fb ** out_fb)716 static void get_disp_fb(struct vdec_vp9_inst *inst, struct vdec_fb **out_fb)
717 {
718 
719 	*out_fb = vp9_rm_from_fb_disp_list(inst);
720 	if (*out_fb)
721 		(*out_fb)->status |= FB_ST_DISPLAY;
722 }
723 
get_free_fb(struct vdec_vp9_inst * inst,struct vdec_fb ** out_fb)724 static void get_free_fb(struct vdec_vp9_inst *inst, struct vdec_fb **out_fb)
725 {
726 	struct vdec_fb_node *node;
727 	struct vdec_fb *fb = NULL;
728 
729 	node = list_first_entry_or_null(&inst->fb_free_list,
730 					struct vdec_fb_node, list);
731 	if (node) {
732 		list_move_tail(&node->list, &inst->available_fb_node_list);
733 		fb = (struct vdec_fb *)node->fb;
734 		fb->status |= FB_ST_FREE;
735 		mtk_vcodec_debug(inst, "[FB] get free fb %p st=%d",
736 				 node->fb, fb->status);
737 	} else {
738 		mtk_vcodec_debug(inst, "[FB] there is no free fb");
739 	}
740 
741 	*out_fb = fb;
742 }
743 
validate_vsi_array_indexes(struct vdec_vp9_inst * inst,struct vdec_vp9_vsi * vsi)744 static int validate_vsi_array_indexes(struct vdec_vp9_inst *inst,
745 		struct vdec_vp9_vsi *vsi) {
746 	if (vsi->sf_frm_idx >= VP9_MAX_FRM_BUF_NUM - 1) {
747 		mtk_vcodec_err(inst, "Invalid vsi->sf_frm_idx=%u.",
748 				vsi->sf_frm_idx);
749 		return -EIO;
750 	}
751 	if (vsi->frm_to_show_idx >= VP9_MAX_FRM_BUF_NUM) {
752 		mtk_vcodec_err(inst, "Invalid vsi->frm_to_show_idx=%u.",
753 				vsi->frm_to_show_idx);
754 		return -EIO;
755 	}
756 	if (vsi->new_fb_idx >= VP9_MAX_FRM_BUF_NUM) {
757 		mtk_vcodec_err(inst, "Invalid vsi->new_fb_idx=%u.",
758 				vsi->new_fb_idx);
759 		return -EIO;
760 	}
761 	return 0;
762 }
763 
vdec_vp9_deinit(void * h_vdec)764 static void vdec_vp9_deinit(void *h_vdec)
765 {
766 	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
767 	struct mtk_vcodec_mem *mem;
768 	int ret = 0;
769 
770 	ret = vpu_dec_deinit(&inst->vpu);
771 	if (ret)
772 		mtk_vcodec_err(inst, "vpu_dec_deinit failed");
773 
774 	mem = &inst->mv_buf;
775 	if (mem->va)
776 		mtk_vcodec_mem_free(inst->ctx, mem);
777 
778 	mem = &inst->seg_id_buf;
779 	if (mem->va)
780 		mtk_vcodec_mem_free(inst->ctx, mem);
781 
782 	vp9_free_all_sf_ref_fb(inst);
783 	vp9_free_inst(inst);
784 }
785 
vdec_vp9_init(struct mtk_vcodec_ctx * ctx)786 static int vdec_vp9_init(struct mtk_vcodec_ctx *ctx)
787 {
788 	struct vdec_vp9_inst *inst;
789 
790 	inst = vp9_alloc_inst(ctx);
791 	if (!inst)
792 		return -ENOMEM;
793 
794 	inst->total_frm_cnt = 0;
795 	inst->ctx = ctx;
796 
797 	inst->vpu.id = IPI_VDEC_VP9;
798 	inst->vpu.ctx = ctx;
799 
800 	if (vpu_dec_init(&inst->vpu)) {
801 		mtk_vcodec_err(inst, "vp9_dec_vpu_init failed");
802 		goto err_deinit_inst;
803 	}
804 
805 	inst->vsi = (struct vdec_vp9_vsi *)inst->vpu.vsi;
806 
807 	inst->vsi->show_frame |= BIT(3);
808 
809 	init_all_fb_lists(inst);
810 
811 	ctx->drv_handle = inst;
812 	return 0;
813 
814 err_deinit_inst:
815 	vp9_free_inst(inst);
816 
817 	return -EINVAL;
818 }
819 
vdec_vp9_decode(void * h_vdec,struct mtk_vcodec_mem * bs,struct vdec_fb * fb,bool * res_chg)820 static int vdec_vp9_decode(void *h_vdec, struct mtk_vcodec_mem *bs,
821 			   struct vdec_fb *fb, bool *res_chg)
822 {
823 	int ret = 0;
824 	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
825 	struct vdec_vp9_vsi *vsi = inst->vsi;
826 	u32 data[3];
827 	int i;
828 
829 	*res_chg = false;
830 
831 	if ((bs == NULL) && (fb == NULL)) {
832 		mtk_vcodec_debug(inst, "[EOS]");
833 		vp9_reset(inst);
834 		return ret;
835 	}
836 
837 	if (bs == NULL) {
838 		mtk_vcodec_err(inst, "bs == NULL");
839 		return -EINVAL;
840 	}
841 
842 	mtk_vcodec_debug(inst, "Input BS Size = %zu", bs->size);
843 
844 	while (1) {
845 		struct vdec_fb *cur_fb = NULL;
846 
847 		data[0] = *((unsigned int *)bs->va);
848 		data[1] = *((unsigned int *)(bs->va + 4));
849 		data[2] = *((unsigned int *)(bs->va + 8));
850 
851 		vsi->bs = *bs;
852 
853 		if (fb)
854 			vsi->fb = *fb;
855 
856 		if (!vsi->sf_init) {
857 			unsigned int sf_bs_sz;
858 			unsigned int sf_bs_off;
859 			unsigned char *sf_bs_src;
860 			unsigned char *sf_bs_dst;
861 
862 			sf_bs_sz = bs->size > VP9_SUPER_FRAME_BS_SZ ?
863 					VP9_SUPER_FRAME_BS_SZ : bs->size;
864 			sf_bs_off = VP9_SUPER_FRAME_BS_SZ - sf_bs_sz;
865 			sf_bs_src = bs->va + bs->size - sf_bs_sz;
866 			sf_bs_dst = vsi->sf_bs_buf + sf_bs_off;
867 			memcpy(sf_bs_dst, sf_bs_src, sf_bs_sz);
868 		} else {
869 			if ((vsi->sf_frm_cnt > 0) &&
870 				(vsi->sf_frm_idx < vsi->sf_frm_cnt)) {
871 				unsigned int idx = vsi->sf_frm_idx;
872 
873 				memcpy((void *)bs->va,
874 					(void *)(bs->va +
875 					vsi->sf_frm_offset[idx]),
876 					vsi->sf_frm_sz[idx]);
877 			}
878 		}
879 
880 		if (!(vsi->show_frame & BIT(4)))
881 			memset(inst->seg_id_buf.va, 0, inst->seg_id_buf.size);
882 
883 		ret = vpu_dec_start(&inst->vpu, data, 3);
884 		if (ret) {
885 			mtk_vcodec_err(inst, "vpu_dec_start failed");
886 			goto DECODE_ERROR;
887 		}
888 
889 		if (vsi->show_frame & BIT(1)) {
890 			memset(inst->seg_id_buf.va, 0, inst->seg_id_buf.size);
891 
892 			if (vsi->show_frame & BIT(2)) {
893 				ret = vpu_dec_start(&inst->vpu, NULL, 0);
894 				if (ret) {
895 					mtk_vcodec_err(inst, "vpu trig decoder failed");
896 					goto DECODE_ERROR;
897 				}
898 			}
899 		}
900 
901 		ret = validate_vsi_array_indexes(inst, vsi);
902 		if (ret) {
903 			mtk_vcodec_err(inst, "Invalid values from VPU.");
904 			goto DECODE_ERROR;
905 		}
906 
907 		if (vsi->resolution_changed) {
908 			if (!vp9_alloc_work_buf(inst)) {
909 				ret = -EIO;
910 				goto DECODE_ERROR;
911 			}
912 		}
913 
914 		if (vsi->sf_frm_cnt > 0) {
915 			cur_fb = &vsi->sf_ref_fb[vsi->sf_next_ref_fb_idx].fb;
916 
917 			if (vsi->sf_frm_idx < vsi->sf_frm_cnt)
918 				inst->cur_fb = cur_fb;
919 			else
920 				inst->cur_fb = fb;
921 		} else {
922 			inst->cur_fb = fb;
923 		}
924 
925 		vsi->frm_bufs[vsi->new_fb_idx].buf.fb = inst->cur_fb;
926 		if (!vp9_is_sf_ref_fb(inst, inst->cur_fb))
927 			vp9_add_to_fb_use_list(inst, inst->cur_fb);
928 
929 		mtk_vcodec_debug(inst, "[#pic %d]", vsi->frm_num);
930 
931 		if (vsi->show_existing_frame)
932 			mtk_vcodec_debug(inst,
933 				"drv->new_fb_idx=%d, drv->frm_to_show_idx=%d",
934 				vsi->new_fb_idx, vsi->frm_to_show_idx);
935 
936 		if (vsi->show_existing_frame && (vsi->frm_to_show_idx <
937 					VP9_MAX_FRM_BUF_NUM)) {
938 			mtk_vcodec_debug(inst,
939 				"Skip Decode drv->new_fb_idx=%d, drv->frm_to_show_idx=%d",
940 				vsi->new_fb_idx, vsi->frm_to_show_idx);
941 
942 			vp9_ref_cnt_fb(inst, &vsi->new_fb_idx,
943 					vsi->frm_to_show_idx);
944 		}
945 
946 		/* VPU assign the buffer pointer in its address space,
947 		 * reassign here
948 		 */
949 		for (i = 0; i < ARRAY_SIZE(vsi->frm_refs); i++) {
950 			unsigned int idx = vsi->frm_refs[i].idx;
951 
952 			vsi->frm_refs[i].buf = &vsi->frm_bufs[idx].buf;
953 		}
954 
955 		if (vsi->resolution_changed) {
956 			*res_chg = true;
957 			mtk_vcodec_debug(inst, "VDEC_ST_RESOLUTION_CHANGED");
958 
959 			ret = 0;
960 			goto DECODE_ERROR;
961 		}
962 
963 		if (!vp9_decode_end_proc(inst)) {
964 			mtk_vcodec_err(inst, "vp9_decode_end_proc");
965 			ret = -EINVAL;
966 			goto DECODE_ERROR;
967 		}
968 
969 		if (vp9_is_last_sub_frm(inst))
970 			break;
971 
972 	}
973 	inst->total_frm_cnt++;
974 
975 DECODE_ERROR:
976 	if (ret < 0)
977 		vp9_add_to_fb_free_list(inst, fb);
978 
979 	return ret;
980 }
981 
get_crop_info(struct vdec_vp9_inst * inst,struct v4l2_rect * cr)982 static void get_crop_info(struct vdec_vp9_inst *inst, struct v4l2_rect *cr)
983 {
984 	cr->left = 0;
985 	cr->top = 0;
986 	cr->width = inst->vsi->pic_w;
987 	cr->height = inst->vsi->pic_h;
988 	mtk_vcodec_debug(inst, "get crop info l=%d, t=%d, w=%d, h=%d\n",
989 			 cr->left, cr->top, cr->width, cr->height);
990 }
991 
vdec_vp9_get_param(void * h_vdec,enum vdec_get_param_type type,void * out)992 static int vdec_vp9_get_param(void *h_vdec, enum vdec_get_param_type type,
993 			      void *out)
994 {
995 	struct vdec_vp9_inst *inst = (struct vdec_vp9_inst *)h_vdec;
996 	int ret = 0;
997 
998 	switch (type) {
999 	case GET_PARAM_DISP_FRAME_BUFFER:
1000 		get_disp_fb(inst, out);
1001 		break;
1002 	case GET_PARAM_FREE_FRAME_BUFFER:
1003 		get_free_fb(inst, out);
1004 		break;
1005 	case GET_PARAM_PIC_INFO:
1006 		get_pic_info(inst, out);
1007 		break;
1008 	case GET_PARAM_DPB_SIZE:
1009 		*((unsigned int *)out) = MAX_VP9_DPB_SIZE;
1010 		break;
1011 	case GET_PARAM_CROP_INFO:
1012 		get_crop_info(inst, out);
1013 		break;
1014 	default:
1015 		mtk_vcodec_err(inst, "not supported param type %d", type);
1016 		ret = -EINVAL;
1017 		break;
1018 	}
1019 
1020 	return ret;
1021 }
1022 
1023 const struct vdec_common_if vdec_vp9_if = {
1024 	.init		= vdec_vp9_init,
1025 	.decode		= vdec_vp9_decode,
1026 	.get_param	= vdec_vp9_get_param,
1027 	.deinit		= vdec_vp9_deinit,
1028 };
1029