]> asedeno.scripts.mit.edu Git - linux.git/blob - drivers/media/platform/mtk-vcodec/vdec/vdec_h264_if.c
Merge tag 'v5.3-rc4' into patchwork
[linux.git] / drivers / media / platform / mtk-vcodec / vdec / vdec_h264_if.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Copyright (c) 2016 MediaTek Inc.
4  * Author: PC Chen <pc.chen@mediatek.com>
5  */
6
7 #include <linux/module.h>
8 #include <linux/slab.h>
9
10 #include "../vdec_drv_if.h"
11 #include "../mtk_vcodec_util.h"
12 #include "../mtk_vcodec_dec.h"
13 #include "../mtk_vcodec_intr.h"
14 #include "../vdec_vpu_if.h"
15 #include "../vdec_drv_base.h"
16
/* NAL unit types this decoder treats specially */
#define NAL_NON_IDR_SLICE	0x01
#define NAL_IDR_SLICE		0x05
#define NAL_H264_PPS		0x08
/* keep only the low five bits of a NAL header byte */
#define NAL_TYPE(value)		((value) & 0x1F)

/* size (bytes) requested for the HW working prediction buffer */
#define BUF_PREDICTION_SZ	(32 * 1024)

/* block edge length used when sizing the motion vector buffers */
#define MB_UNIT_LEN		16

/* motion vector size (bytes) for every macro block */
#define HW_MB_STORE_SZ		64

/* number of entries in the frame buffer ring lists and mv buffer arrays */
#define H264_MAX_FB_NUM		17
/* size (bytes) of the header parsing buffer inside the shared vsi */
#define HDR_PARSING_BUF_SZ	1024

/* error code carried above the low 16 bits of a vpu_dec_start() result */
#define DEC_ERR_RET(ret)	((ret) >> 16)
#define H264_ERR_NOT_VALID	3
34
/**
 * struct h264_fb - one frame buffer entry of a ring list
 * @vdec_fb_va  : address of the matching struct vdec_fb, kept as an integer
 * @y_fb_dma    : dma address of the luma (Y) frame buffer
 * @c_fb_dma    : dma address of the chroma (C) frame buffer
 * @poc         : picture order count of the frame buffer
 * @reserved    : padding, keeps the entry 8 bytes aligned
 */
struct h264_fb {
	uint64_t vdec_fb_va;
	uint64_t y_fb_dma;
	uint64_t c_fb_dma;
	int32_t poc;
	uint32_t reserved;
};
50
51 /**
52  * struct h264_ring_fb_list - ring frame buffer list
53  * @fb_list   : frame buffer array
54  * @read_idx  : read index
55  * @write_idx : write index
56  * @count     : buffer count in list
57  * @reserved  : for 8 bytes alignment
58  */
59 struct h264_ring_fb_list {
60         struct h264_fb fb_list[H264_MAX_FB_NUM];
61         unsigned int read_idx;
62         unsigned int write_idx;
63         unsigned int count;
64         unsigned int reserved;
65 };
66
/**
 * struct vdec_h264_dec_info - per-decode information
 * @dpb_sz              : decoded picture buffer size
 * @resolution_changed  : non-zero when a resolution change happened
 * @realloc_mv_buf      : non-zero when the driver must re-allocate mv buffers
 * @reserved            : padding, keeps the 64-bit members 8 bytes aligned
 * @bs_dma              : dma address of the input bit-stream buffer
 * @y_fb_dma            : dma address of the Y frame buffer
 * @c_fb_dma            : dma address of the C frame buffer
 * @vdec_fb_va          : address of the struct vdec_fb, kept as an integer
 */
struct vdec_h264_dec_info {
	uint32_t dpb_sz;
	uint32_t resolution_changed;
	uint32_t realloc_mv_buf;
	uint32_t reserved;
	uint64_t bs_dma;
	uint64_t y_fb_dma;
	uint64_t c_fb_dma;
	uint64_t vdec_fb_va;
};
88
89 /**
90  * struct vdec_h264_vsi - shared memory for decode information exchange
91  *                        between VPU and Host.
92  *                        The memory is allocated by VPU then mapping to Host
93  *                        in vpu_dec_init() and freed in vpu_dec_deinit()
94  *                        by VPU.
95  *                        AP-W/R : AP is writer/reader on this item
96  *                        VPU-W/R: VPU is write/reader on this item
97  * @hdr_buf      : Header parsing buffer (AP-W, VPU-R)
98  * @pred_buf_dma : HW working predication buffer dma address (AP-W, VPU-R)
99  * @mv_buf_dma   : HW working motion vector buffer dma address (AP-W, VPU-R)
100  * @list_free    : free frame buffer ring list (AP-W/R, VPU-W)
101  * @list_disp    : display frame buffer ring list (AP-R, VPU-W)
102  * @dec          : decode information (AP-R, VPU-W)
103  * @pic          : picture information (AP-R, VPU-W)
104  * @crop         : crop information (AP-R, VPU-W)
105  */
106 struct vdec_h264_vsi {
107         unsigned char hdr_buf[HDR_PARSING_BUF_SZ];
108         uint64_t pred_buf_dma;
109         uint64_t mv_buf_dma[H264_MAX_FB_NUM];
110         struct h264_ring_fb_list list_free;
111         struct h264_ring_fb_list list_disp;
112         struct vdec_h264_dec_info dec;
113         struct vdec_pic_info pic;
114         struct v4l2_rect crop;
115 };
116
117 /**
118  * struct vdec_h264_inst - h264 decoder instance
119  * @num_nalu : how many nalus be decoded
120  * @ctx      : point to mtk_vcodec_ctx
121  * @pred_buf : HW working predication buffer
122  * @mv_buf   : HW working motion vector buffer
123  * @vpu      : VPU instance
124  * @vsi      : VPU shared information
125  */
126 struct vdec_h264_inst {
127         unsigned int num_nalu;
128         struct mtk_vcodec_ctx *ctx;
129         struct mtk_vcodec_mem pred_buf;
130         struct mtk_vcodec_mem mv_buf[H264_MAX_FB_NUM];
131         struct vdec_vpu_inst vpu;
132         struct vdec_h264_vsi *vsi;
133 };
134
135 static unsigned int get_mv_buf_size(unsigned int width, unsigned int height)
136 {
137         return HW_MB_STORE_SZ * (width/MB_UNIT_LEN) * (height/MB_UNIT_LEN);
138 }
139
140 static int allocate_predication_buf(struct vdec_h264_inst *inst)
141 {
142         int err = 0;
143
144         inst->pred_buf.size = BUF_PREDICTION_SZ;
145         err = mtk_vcodec_mem_alloc(inst->ctx, &inst->pred_buf);
146         if (err) {
147                 mtk_vcodec_err(inst, "failed to allocate ppl buf");
148                 return err;
149         }
150
151         inst->vsi->pred_buf_dma = inst->pred_buf.dma_addr;
152         return 0;
153 }
154
155 static void free_predication_buf(struct vdec_h264_inst *inst)
156 {
157         struct mtk_vcodec_mem *mem = NULL;
158
159         mtk_vcodec_debug_enter(inst);
160
161         inst->vsi->pred_buf_dma = 0;
162         mem = &inst->pred_buf;
163         if (mem->va)
164                 mtk_vcodec_mem_free(inst->ctx, mem);
165 }
166
167 static int alloc_mv_buf(struct vdec_h264_inst *inst, struct vdec_pic_info *pic)
168 {
169         int i;
170         int err;
171         struct mtk_vcodec_mem *mem = NULL;
172         unsigned int buf_sz = get_mv_buf_size(pic->buf_w, pic->buf_h);
173
174         for (i = 0; i < H264_MAX_FB_NUM; i++) {
175                 mem = &inst->mv_buf[i];
176                 if (mem->va)
177                         mtk_vcodec_mem_free(inst->ctx, mem);
178                 mem->size = buf_sz;
179                 err = mtk_vcodec_mem_alloc(inst->ctx, mem);
180                 if (err) {
181                         mtk_vcodec_err(inst, "failed to allocate mv buf");
182                         return err;
183                 }
184                 inst->vsi->mv_buf_dma[i] = mem->dma_addr;
185         }
186
187         return 0;
188 }
189
190 static void free_mv_buf(struct vdec_h264_inst *inst)
191 {
192         int i;
193         struct mtk_vcodec_mem *mem = NULL;
194
195         for (i = 0; i < H264_MAX_FB_NUM; i++) {
196                 inst->vsi->mv_buf_dma[i] = 0;
197                 mem = &inst->mv_buf[i];
198                 if (mem->va)
199                         mtk_vcodec_mem_free(inst->ctx, mem);
200         }
201 }
202
203 static int check_list_validity(struct vdec_h264_inst *inst, bool disp_list)
204 {
205         struct h264_ring_fb_list *list;
206
207         list = disp_list ? &inst->vsi->list_disp : &inst->vsi->list_free;
208
209         if (list->count > H264_MAX_FB_NUM ||
210             list->read_idx >= H264_MAX_FB_NUM ||
211             list->write_idx >= H264_MAX_FB_NUM) {
212                 mtk_vcodec_err(inst, "%s list err: cnt=%d r_idx=%d w_idx=%d",
213                                disp_list ? "disp" : "free", list->count,
214                                list->read_idx, list->write_idx);
215                 return -EINVAL;
216         }
217
218         return 0;
219 }
220
221 static void put_fb_to_free(struct vdec_h264_inst *inst, struct vdec_fb *fb)
222 {
223         struct h264_ring_fb_list *list;
224
225         if (fb) {
226                 if (check_list_validity(inst, false))
227                         return;
228
229                 list = &inst->vsi->list_free;
230                 if (list->count == H264_MAX_FB_NUM) {
231                         mtk_vcodec_err(inst, "[FB] put fb free_list full");
232                         return;
233                 }
234
235                 mtk_vcodec_debug(inst, "[FB] put fb into free_list @(%p, %llx)",
236                                  fb->base_y.va, (u64)fb->base_y.dma_addr);
237
238                 list->fb_list[list->write_idx].vdec_fb_va = (u64)(uintptr_t)fb;
239                 list->write_idx = (list->write_idx == H264_MAX_FB_NUM - 1) ?
240                                   0 : list->write_idx + 1;
241                 list->count++;
242         }
243 }
244
245 static void get_pic_info(struct vdec_h264_inst *inst,
246                          struct vdec_pic_info *pic)
247 {
248         *pic = inst->vsi->pic;
249         mtk_vcodec_debug(inst, "pic(%d, %d), buf(%d, %d)",
250                          pic->pic_w, pic->pic_h, pic->buf_w, pic->buf_h);
251         mtk_vcodec_debug(inst, "fb size: Y(%d), C(%d)",
252                          pic->fb_sz[0], pic->fb_sz[1]);
253 }
254
255 static void get_crop_info(struct vdec_h264_inst *inst, struct v4l2_rect *cr)
256 {
257         cr->left = inst->vsi->crop.left;
258         cr->top = inst->vsi->crop.top;
259         cr->width = inst->vsi->crop.width;
260         cr->height = inst->vsi->crop.height;
261
262         mtk_vcodec_debug(inst, "l=%d, t=%d, w=%d, h=%d",
263                          cr->left, cr->top, cr->width, cr->height);
264 }
265
266 static void get_dpb_size(struct vdec_h264_inst *inst, unsigned int *dpb_sz)
267 {
268         *dpb_sz = inst->vsi->dec.dpb_sz;
269         mtk_vcodec_debug(inst, "sz=%d", *dpb_sz);
270 }
271
272 static int vdec_h264_init(struct mtk_vcodec_ctx *ctx)
273 {
274         struct vdec_h264_inst *inst = NULL;
275         int err;
276
277         inst = kzalloc(sizeof(*inst), GFP_KERNEL);
278         if (!inst)
279                 return -ENOMEM;
280
281         inst->ctx = ctx;
282
283         inst->vpu.id = IPI_VDEC_H264;
284         inst->vpu.dev = ctx->dev->vpu_plat_dev;
285         inst->vpu.ctx = ctx;
286         inst->vpu.handler = vpu_dec_ipi_handler;
287
288         err = vpu_dec_init(&inst->vpu);
289         if (err) {
290                 mtk_vcodec_err(inst, "vdec_h264 init err=%d", err);
291                 goto error_free_inst;
292         }
293
294         inst->vsi = (struct vdec_h264_vsi *)inst->vpu.vsi;
295         err = allocate_predication_buf(inst);
296         if (err)
297                 goto error_deinit;
298
299         mtk_vcodec_debug(inst, "H264 Instance >> %p", inst);
300
301         ctx->drv_handle = inst;
302         return 0;
303
304 error_deinit:
305         vpu_dec_deinit(&inst->vpu);
306
307 error_free_inst:
308         kfree(inst);
309         return err;
310 }
311
312 static void vdec_h264_deinit(void *h_vdec)
313 {
314         struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec;
315
316         mtk_vcodec_debug_enter(inst);
317
318         vpu_dec_deinit(&inst->vpu);
319         free_predication_buf(inst);
320         free_mv_buf(inst);
321
322         kfree(inst);
323 }
324
/*
 * Look for a start code at the very beginning of @data.
 *
 * Returns 3 for the sequence 00 00 01 and 4 for 00 00 00 01, provided at
 * least one more byte follows the start code; returns -1 otherwise. The
 * return value is therefore the index of the first byte after the code.
 */
static int find_start_code(unsigned char *data, unsigned int data_sz)
{
	/* both forms need more than three bytes and begin with 00 00 */
	if (data_sz <= 3 || data[0] != 0 || data[1] != 0)
		return -1;

	if (data[2] == 1)
		return 3;

	if (data_sz > 4 && data[2] == 0 && data[3] == 1)
		return 4;

	return -1;
}
336
337 static int vdec_h264_decode(void *h_vdec, struct mtk_vcodec_mem *bs,
338                             struct vdec_fb *fb, bool *res_chg)
339 {
340         struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec;
341         struct vdec_vpu_inst *vpu = &inst->vpu;
342         int nal_start_idx = 0;
343         int err = 0;
344         unsigned int nal_start;
345         unsigned int nal_type;
346         unsigned char *buf;
347         unsigned int buf_sz;
348         unsigned int data[2];
349         uint64_t vdec_fb_va = (u64)(uintptr_t)fb;
350         uint64_t y_fb_dma = fb ? (u64)fb->base_y.dma_addr : 0;
351         uint64_t c_fb_dma = fb ? (u64)fb->base_c.dma_addr : 0;
352
353         mtk_vcodec_debug(inst, "+ [%d] FB y_dma=%llx c_dma=%llx va=%p",
354                          ++inst->num_nalu, y_fb_dma, c_fb_dma, fb);
355
356         /* bs NULL means flush decoder */
357         if (bs == NULL)
358                 return vpu_dec_reset(vpu);
359
360         buf = (unsigned char *)bs->va;
361         buf_sz = bs->size;
362         nal_start_idx = find_start_code(buf, buf_sz);
363         if (nal_start_idx < 0) {
364                 mtk_vcodec_err(inst, "invalid nal start code");
365                 err = -EIO;
366                 goto err_free_fb_out;
367         }
368
369         nal_start = buf[nal_start_idx];
370         nal_type = NAL_TYPE(buf[nal_start_idx]);
371         mtk_vcodec_debug(inst, "\n + NALU[%d] type %d +\n", inst->num_nalu,
372                          nal_type);
373
374         if (nal_type == NAL_H264_PPS) {
375                 buf_sz -= nal_start_idx;
376                 if (buf_sz > HDR_PARSING_BUF_SZ) {
377                         err = -EILSEQ;
378                         goto err_free_fb_out;
379                 }
380                 memcpy(inst->vsi->hdr_buf, buf + nal_start_idx, buf_sz);
381         }
382
383         inst->vsi->dec.bs_dma = (uint64_t)bs->dma_addr;
384         inst->vsi->dec.y_fb_dma = y_fb_dma;
385         inst->vsi->dec.c_fb_dma = c_fb_dma;
386         inst->vsi->dec.vdec_fb_va = vdec_fb_va;
387
388         data[0] = buf_sz;
389         data[1] = nal_start;
390         err = vpu_dec_start(vpu, data, 2);
391         if (err) {
392                 if (err > 0 && (DEC_ERR_RET(err) == H264_ERR_NOT_VALID)) {
393                         mtk_vcodec_err(inst, "- error bitstream - err = %d -",
394                                        err);
395                         err = -EIO;
396                 }
397                 goto err_free_fb_out;
398         }
399
400         *res_chg = inst->vsi->dec.resolution_changed;
401         if (*res_chg) {
402                 struct vdec_pic_info pic;
403
404                 mtk_vcodec_debug(inst, "- resolution changed -");
405                 get_pic_info(inst, &pic);
406
407                 if (inst->vsi->dec.realloc_mv_buf) {
408                         err = alloc_mv_buf(inst, &pic);
409                         if (err)
410                                 goto err_free_fb_out;
411                 }
412         }
413
414         if (nal_type == NAL_NON_IDR_SLICE || nal_type == NAL_IDR_SLICE) {
415                 /* wait decoder done interrupt */
416                 err = mtk_vcodec_wait_for_done_ctx(inst->ctx,
417                                                    MTK_INST_IRQ_RECEIVED,
418                                                    WAIT_INTR_TIMEOUT_MS);
419                 if (err)
420                         goto err_free_fb_out;
421
422                 vpu_dec_end(vpu);
423         }
424
425         mtk_vcodec_debug(inst, "\n - NALU[%d] type=%d -\n", inst->num_nalu,
426                          nal_type);
427         return 0;
428
429 err_free_fb_out:
430         put_fb_to_free(inst, fb);
431         mtk_vcodec_err(inst, "\n - NALU[%d] err=%d -\n", inst->num_nalu, err);
432         return err;
433 }
434
435 static void vdec_h264_get_fb(struct vdec_h264_inst *inst,
436                              struct h264_ring_fb_list *list,
437                              bool disp_list, struct vdec_fb **out_fb)
438 {
439         struct vdec_fb *fb;
440
441         if (check_list_validity(inst, disp_list))
442                 return;
443
444         if (list->count == 0) {
445                 mtk_vcodec_debug(inst, "[FB] there is no %s fb",
446                                  disp_list ? "disp" : "free");
447                 *out_fb = NULL;
448                 return;
449         }
450
451         fb = (struct vdec_fb *)
452                 (uintptr_t)list->fb_list[list->read_idx].vdec_fb_va;
453         fb->status |= (disp_list ? FB_ST_DISPLAY : FB_ST_FREE);
454
455         *out_fb = fb;
456         mtk_vcodec_debug(inst, "[FB] get %s fb st=%d poc=%d %llx",
457                          disp_list ? "disp" : "free",
458                          fb->status, list->fb_list[list->read_idx].poc,
459                          list->fb_list[list->read_idx].vdec_fb_va);
460
461         list->read_idx = (list->read_idx == H264_MAX_FB_NUM - 1) ?
462                          0 : list->read_idx + 1;
463         list->count--;
464 }
465
466 static int vdec_h264_get_param(void *h_vdec, enum vdec_get_param_type type,
467                                void *out)
468 {
469         struct vdec_h264_inst *inst = (struct vdec_h264_inst *)h_vdec;
470
471         switch (type) {
472         case GET_PARAM_DISP_FRAME_BUFFER:
473                 vdec_h264_get_fb(inst, &inst->vsi->list_disp, true, out);
474                 break;
475
476         case GET_PARAM_FREE_FRAME_BUFFER:
477                 vdec_h264_get_fb(inst, &inst->vsi->list_free, false, out);
478                 break;
479
480         case GET_PARAM_PIC_INFO:
481                 get_pic_info(inst, out);
482                 break;
483
484         case GET_PARAM_DPB_SIZE:
485                 get_dpb_size(inst, out);
486                 break;
487
488         case GET_PARAM_CROP_INFO:
489                 get_crop_info(inst, out);
490                 break;
491
492         default:
493                 mtk_vcodec_err(inst, "invalid get parameter type=%d", type);
494                 return -EINVAL;
495         }
496
497         return 0;
498 }
499
500 const struct vdec_common_if vdec_h264_if = {
501         .init           = vdec_h264_init,
502         .decode         = vdec_h264_decode,
503         .get_param      = vdec_h264_get_param,
504         .deinit         = vdec_h264_deinit,
505 };