1*fbb6c848SEzequiel Garcia // SPDX-License-Identifier: GPL-2.0
2*fbb6c848SEzequiel Garcia /*
3*fbb6c848SEzequiel Garcia * Hantro VPU codec driver
4*fbb6c848SEzequiel Garcia *
5*fbb6c848SEzequiel Garcia * Copyright (C) 2018 Rockchip Electronics Co., Ltd.
6*fbb6c848SEzequiel Garcia */
7*fbb6c848SEzequiel Garcia
8*fbb6c848SEzequiel Garcia #include "hantro.h"
9*fbb6c848SEzequiel Garcia
10*fbb6c848SEzequiel Garcia /*
11*fbb6c848SEzequiel Garcia * probs table with packed
12*fbb6c848SEzequiel Garcia */
13*fbb6c848SEzequiel Garcia struct vp8_prob_tbl_packed {
14*fbb6c848SEzequiel Garcia u8 prob_mb_skip_false;
15*fbb6c848SEzequiel Garcia u8 prob_intra;
16*fbb6c848SEzequiel Garcia u8 prob_ref_last;
17*fbb6c848SEzequiel Garcia u8 prob_ref_golden;
18*fbb6c848SEzequiel Garcia u8 prob_segment[3];
19*fbb6c848SEzequiel Garcia u8 padding0;
20*fbb6c848SEzequiel Garcia
21*fbb6c848SEzequiel Garcia u8 prob_luma_16x16_pred_mode[4];
22*fbb6c848SEzequiel Garcia u8 prob_chroma_pred_mode[3];
23*fbb6c848SEzequiel Garcia u8 padding1;
24*fbb6c848SEzequiel Garcia
25*fbb6c848SEzequiel Garcia /* mv prob */
26*fbb6c848SEzequiel Garcia u8 prob_mv_context[2][V4L2_VP8_MV_PROB_CNT];
27*fbb6c848SEzequiel Garcia u8 padding2[2];
28*fbb6c848SEzequiel Garcia
29*fbb6c848SEzequiel Garcia /* coeff probs */
30*fbb6c848SEzequiel Garcia u8 prob_coeffs[4][8][3][V4L2_VP8_COEFF_PROB_CNT];
31*fbb6c848SEzequiel Garcia u8 padding3[96];
32*fbb6c848SEzequiel Garcia };
33*fbb6c848SEzequiel Garcia
34*fbb6c848SEzequiel Garcia /*
35*fbb6c848SEzequiel Garcia * filter taps taken to 7-bit precision,
36*fbb6c848SEzequiel Garcia * reference RFC6386#Page-16, filters[8][6]
37*fbb6c848SEzequiel Garcia */
38*fbb6c848SEzequiel Garcia const u32 hantro_vp8_dec_mc_filter[8][6] = {
39*fbb6c848SEzequiel Garcia { 0, 0, 128, 0, 0, 0 },
40*fbb6c848SEzequiel Garcia { 0, -6, 123, 12, -1, 0 },
41*fbb6c848SEzequiel Garcia { 2, -11, 108, 36, -8, 1 },
42*fbb6c848SEzequiel Garcia { 0, -9, 93, 50, -6, 0 },
43*fbb6c848SEzequiel Garcia { 3, -16, 77, 77, -16, 3 },
44*fbb6c848SEzequiel Garcia { 0, -6, 50, 93, -9, 0 },
45*fbb6c848SEzequiel Garcia { 1, -8, 36, 108, -11, 2 },
46*fbb6c848SEzequiel Garcia { 0, -1, 12, 123, -6, 0 }
47*fbb6c848SEzequiel Garcia };
48*fbb6c848SEzequiel Garcia
hantro_vp8_prob_update(struct hantro_ctx * ctx,const struct v4l2_ctrl_vp8_frame * hdr)49*fbb6c848SEzequiel Garcia void hantro_vp8_prob_update(struct hantro_ctx *ctx,
50*fbb6c848SEzequiel Garcia const struct v4l2_ctrl_vp8_frame *hdr)
51*fbb6c848SEzequiel Garcia {
52*fbb6c848SEzequiel Garcia const struct v4l2_vp8_entropy *entropy = &hdr->entropy;
53*fbb6c848SEzequiel Garcia u32 i, j, k;
54*fbb6c848SEzequiel Garcia u8 *dst;
55*fbb6c848SEzequiel Garcia
56*fbb6c848SEzequiel Garcia /* first probs */
57*fbb6c848SEzequiel Garcia dst = ctx->vp8_dec.prob_tbl.cpu;
58*fbb6c848SEzequiel Garcia
59*fbb6c848SEzequiel Garcia dst[0] = hdr->prob_skip_false;
60*fbb6c848SEzequiel Garcia dst[1] = hdr->prob_intra;
61*fbb6c848SEzequiel Garcia dst[2] = hdr->prob_last;
62*fbb6c848SEzequiel Garcia dst[3] = hdr->prob_gf;
63*fbb6c848SEzequiel Garcia dst[4] = hdr->segment.segment_probs[0];
64*fbb6c848SEzequiel Garcia dst[5] = hdr->segment.segment_probs[1];
65*fbb6c848SEzequiel Garcia dst[6] = hdr->segment.segment_probs[2];
66*fbb6c848SEzequiel Garcia dst[7] = 0;
67*fbb6c848SEzequiel Garcia
68*fbb6c848SEzequiel Garcia dst += 8;
69*fbb6c848SEzequiel Garcia dst[0] = entropy->y_mode_probs[0];
70*fbb6c848SEzequiel Garcia dst[1] = entropy->y_mode_probs[1];
71*fbb6c848SEzequiel Garcia dst[2] = entropy->y_mode_probs[2];
72*fbb6c848SEzequiel Garcia dst[3] = entropy->y_mode_probs[3];
73*fbb6c848SEzequiel Garcia dst[4] = entropy->uv_mode_probs[0];
74*fbb6c848SEzequiel Garcia dst[5] = entropy->uv_mode_probs[1];
75*fbb6c848SEzequiel Garcia dst[6] = entropy->uv_mode_probs[2];
76*fbb6c848SEzequiel Garcia dst[7] = 0; /*unused */
77*fbb6c848SEzequiel Garcia
78*fbb6c848SEzequiel Garcia /* mv probs */
79*fbb6c848SEzequiel Garcia dst += 8;
80*fbb6c848SEzequiel Garcia dst[0] = entropy->mv_probs[0][0]; /* is short */
81*fbb6c848SEzequiel Garcia dst[1] = entropy->mv_probs[1][0];
82*fbb6c848SEzequiel Garcia dst[2] = entropy->mv_probs[0][1]; /* sign */
83*fbb6c848SEzequiel Garcia dst[3] = entropy->mv_probs[1][1];
84*fbb6c848SEzequiel Garcia dst[4] = entropy->mv_probs[0][8 + 9];
85*fbb6c848SEzequiel Garcia dst[5] = entropy->mv_probs[0][9 + 9];
86*fbb6c848SEzequiel Garcia dst[6] = entropy->mv_probs[1][8 + 9];
87*fbb6c848SEzequiel Garcia dst[7] = entropy->mv_probs[1][9 + 9];
88*fbb6c848SEzequiel Garcia dst += 8;
89*fbb6c848SEzequiel Garcia for (i = 0; i < 2; ++i) {
90*fbb6c848SEzequiel Garcia for (j = 0; j < 8; j += 4) {
91*fbb6c848SEzequiel Garcia dst[0] = entropy->mv_probs[i][j + 9 + 0];
92*fbb6c848SEzequiel Garcia dst[1] = entropy->mv_probs[i][j + 9 + 1];
93*fbb6c848SEzequiel Garcia dst[2] = entropy->mv_probs[i][j + 9 + 2];
94*fbb6c848SEzequiel Garcia dst[3] = entropy->mv_probs[i][j + 9 + 3];
95*fbb6c848SEzequiel Garcia dst += 4;
96*fbb6c848SEzequiel Garcia }
97*fbb6c848SEzequiel Garcia }
98*fbb6c848SEzequiel Garcia for (i = 0; i < 2; ++i) {
99*fbb6c848SEzequiel Garcia dst[0] = entropy->mv_probs[i][0 + 2];
100*fbb6c848SEzequiel Garcia dst[1] = entropy->mv_probs[i][1 + 2];
101*fbb6c848SEzequiel Garcia dst[2] = entropy->mv_probs[i][2 + 2];
102*fbb6c848SEzequiel Garcia dst[3] = entropy->mv_probs[i][3 + 2];
103*fbb6c848SEzequiel Garcia dst[4] = entropy->mv_probs[i][4 + 2];
104*fbb6c848SEzequiel Garcia dst[5] = entropy->mv_probs[i][5 + 2];
105*fbb6c848SEzequiel Garcia dst[6] = entropy->mv_probs[i][6 + 2];
106*fbb6c848SEzequiel Garcia dst[7] = 0; /*unused */
107*fbb6c848SEzequiel Garcia dst += 8;
108*fbb6c848SEzequiel Garcia }
109*fbb6c848SEzequiel Garcia
110*fbb6c848SEzequiel Garcia /* coeff probs (header part) */
111*fbb6c848SEzequiel Garcia dst = ctx->vp8_dec.prob_tbl.cpu;
112*fbb6c848SEzequiel Garcia dst += (8 * 7);
113*fbb6c848SEzequiel Garcia for (i = 0; i < 4; ++i) {
114*fbb6c848SEzequiel Garcia for (j = 0; j < 8; ++j) {
115*fbb6c848SEzequiel Garcia for (k = 0; k < 3; ++k) {
116*fbb6c848SEzequiel Garcia dst[0] = entropy->coeff_probs[i][j][k][0];
117*fbb6c848SEzequiel Garcia dst[1] = entropy->coeff_probs[i][j][k][1];
118*fbb6c848SEzequiel Garcia dst[2] = entropy->coeff_probs[i][j][k][2];
119*fbb6c848SEzequiel Garcia dst[3] = entropy->coeff_probs[i][j][k][3];
120*fbb6c848SEzequiel Garcia dst += 4;
121*fbb6c848SEzequiel Garcia }
122*fbb6c848SEzequiel Garcia }
123*fbb6c848SEzequiel Garcia }
124*fbb6c848SEzequiel Garcia
125*fbb6c848SEzequiel Garcia /* coeff probs (footer part) */
126*fbb6c848SEzequiel Garcia dst = ctx->vp8_dec.prob_tbl.cpu;
127*fbb6c848SEzequiel Garcia dst += (8 * 55);
128*fbb6c848SEzequiel Garcia for (i = 0; i < 4; ++i) {
129*fbb6c848SEzequiel Garcia for (j = 0; j < 8; ++j) {
130*fbb6c848SEzequiel Garcia for (k = 0; k < 3; ++k) {
131*fbb6c848SEzequiel Garcia dst[0] = entropy->coeff_probs[i][j][k][4];
132*fbb6c848SEzequiel Garcia dst[1] = entropy->coeff_probs[i][j][k][5];
133*fbb6c848SEzequiel Garcia dst[2] = entropy->coeff_probs[i][j][k][6];
134*fbb6c848SEzequiel Garcia dst[3] = entropy->coeff_probs[i][j][k][7];
135*fbb6c848SEzequiel Garcia dst[4] = entropy->coeff_probs[i][j][k][8];
136*fbb6c848SEzequiel Garcia dst[5] = entropy->coeff_probs[i][j][k][9];
137*fbb6c848SEzequiel Garcia dst[6] = entropy->coeff_probs[i][j][k][10];
138*fbb6c848SEzequiel Garcia dst[7] = 0; /*unused */
139*fbb6c848SEzequiel Garcia dst += 8;
140*fbb6c848SEzequiel Garcia }
141*fbb6c848SEzequiel Garcia }
142*fbb6c848SEzequiel Garcia }
143*fbb6c848SEzequiel Garcia }
144*fbb6c848SEzequiel Garcia
hantro_vp8_dec_init(struct hantro_ctx * ctx)145*fbb6c848SEzequiel Garcia int hantro_vp8_dec_init(struct hantro_ctx *ctx)
146*fbb6c848SEzequiel Garcia {
147*fbb6c848SEzequiel Garcia struct hantro_dev *vpu = ctx->dev;
148*fbb6c848SEzequiel Garcia struct hantro_aux_buf *aux_buf;
149*fbb6c848SEzequiel Garcia unsigned int mb_width, mb_height;
150*fbb6c848SEzequiel Garcia size_t segment_map_size;
151*fbb6c848SEzequiel Garcia int ret;
152*fbb6c848SEzequiel Garcia
153*fbb6c848SEzequiel Garcia /* segment map table size calculation */
154*fbb6c848SEzequiel Garcia mb_width = DIV_ROUND_UP(ctx->dst_fmt.width, 16);
155*fbb6c848SEzequiel Garcia mb_height = DIV_ROUND_UP(ctx->dst_fmt.height, 16);
156*fbb6c848SEzequiel Garcia segment_map_size = round_up(DIV_ROUND_UP(mb_width * mb_height, 4), 64);
157*fbb6c848SEzequiel Garcia
158*fbb6c848SEzequiel Garcia /*
159*fbb6c848SEzequiel Garcia * In context init the dma buffer for segment map must be allocated.
160*fbb6c848SEzequiel Garcia * And the data in segment map buffer must be set to all zero.
161*fbb6c848SEzequiel Garcia */
162*fbb6c848SEzequiel Garcia aux_buf = &ctx->vp8_dec.segment_map;
163*fbb6c848SEzequiel Garcia aux_buf->size = segment_map_size;
164*fbb6c848SEzequiel Garcia aux_buf->cpu = dma_alloc_coherent(vpu->dev, aux_buf->size,
165*fbb6c848SEzequiel Garcia &aux_buf->dma, GFP_KERNEL);
166*fbb6c848SEzequiel Garcia if (!aux_buf->cpu)
167*fbb6c848SEzequiel Garcia return -ENOMEM;
168*fbb6c848SEzequiel Garcia
169*fbb6c848SEzequiel Garcia /*
170*fbb6c848SEzequiel Garcia * Allocate probability table buffer,
171*fbb6c848SEzequiel Garcia * total 1208 bytes, 4K page is far enough.
172*fbb6c848SEzequiel Garcia */
173*fbb6c848SEzequiel Garcia aux_buf = &ctx->vp8_dec.prob_tbl;
174*fbb6c848SEzequiel Garcia aux_buf->size = sizeof(struct vp8_prob_tbl_packed);
175*fbb6c848SEzequiel Garcia aux_buf->cpu = dma_alloc_coherent(vpu->dev, aux_buf->size,
176*fbb6c848SEzequiel Garcia &aux_buf->dma, GFP_KERNEL);
177*fbb6c848SEzequiel Garcia if (!aux_buf->cpu) {
178*fbb6c848SEzequiel Garcia ret = -ENOMEM;
179*fbb6c848SEzequiel Garcia goto err_free_seg_map;
180*fbb6c848SEzequiel Garcia }
181*fbb6c848SEzequiel Garcia
182*fbb6c848SEzequiel Garcia return 0;
183*fbb6c848SEzequiel Garcia
184*fbb6c848SEzequiel Garcia err_free_seg_map:
185*fbb6c848SEzequiel Garcia dma_free_coherent(vpu->dev, ctx->vp8_dec.segment_map.size,
186*fbb6c848SEzequiel Garcia ctx->vp8_dec.segment_map.cpu,
187*fbb6c848SEzequiel Garcia ctx->vp8_dec.segment_map.dma);
188*fbb6c848SEzequiel Garcia
189*fbb6c848SEzequiel Garcia return ret;
190*fbb6c848SEzequiel Garcia }
191*fbb6c848SEzequiel Garcia
hantro_vp8_dec_exit(struct hantro_ctx * ctx)192*fbb6c848SEzequiel Garcia void hantro_vp8_dec_exit(struct hantro_ctx *ctx)
193*fbb6c848SEzequiel Garcia {
194*fbb6c848SEzequiel Garcia struct hantro_vp8_dec_hw_ctx *vp8_dec = &ctx->vp8_dec;
195*fbb6c848SEzequiel Garcia struct hantro_dev *vpu = ctx->dev;
196*fbb6c848SEzequiel Garcia
197*fbb6c848SEzequiel Garcia dma_free_coherent(vpu->dev, vp8_dec->segment_map.size,
198*fbb6c848SEzequiel Garcia vp8_dec->segment_map.cpu, vp8_dec->segment_map.dma);
199*fbb6c848SEzequiel Garcia dma_free_coherent(vpu->dev, vp8_dec->prob_tbl.size,
200*fbb6c848SEzequiel Garcia vp8_dec->prob_tbl.cpu, vp8_dec->prob_tbl.dma);
201*fbb6c848SEzequiel Garcia }
202