Commit | Line | Data |
---|---|---|
2ba45a60 DM |
1 | /* |
2 | * HEVC video decoder | |
3 | * | |
4 | * Copyright (C) 2012 - 2013 Guillaume Martres | |
5 | * Copyright (C) 2013 Seppo Tomperi | |
6 | * Copyright (C) 2013 Wassim Hamidouche | |
7 | * | |
8 | * This file is part of FFmpeg. | |
9 | * | |
10 | * FFmpeg is free software; you can redistribute it and/or | |
11 | * modify it under the terms of the GNU Lesser General Public | |
12 | * License as published by the Free Software Foundation; either | |
13 | * version 2.1 of the License, or (at your option) any later version. | |
14 | * | |
15 | * FFmpeg is distributed in the hope that it will be useful, | |
16 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
18 | * Lesser General Public License for more details. | |
19 | * | |
20 | * You should have received a copy of the GNU Lesser General Public | |
21 | * License along with FFmpeg; if not, write to the Free Software | |
22 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
23 | */ | |
24 | ||
25 | #include "libavutil/common.h" | |
26 | #include "libavutil/internal.h" | |
27 | ||
28 | #include "cabac_functions.h" | |
29 | #include "golomb.h" | |
30 | #include "hevc.h" | |
31 | ||
32 | #include "bit_depth_template.c" | |
33 | ||
34 | #define LUMA 0 | |
35 | #define CB 1 | |
36 | #define CR 2 | |
37 | ||
38 | static const uint8_t tctable[54] = { | |
39 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, // QP 0...18 | |
40 | 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 4, // QP 19...37 | |
41 | 5, 5, 6, 6, 7, 8, 9, 10, 11, 13, 14, 16, 18, 20, 22, 24 // QP 38...53 | |
42 | }; | |
43 | ||
44 | static const uint8_t betatable[52] = { | |
45 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 6, 7, 8, // QP 0...18 | |
46 | 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, // QP 19...37 | |
47 | 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, 58, 60, 62, 64 // QP 38...51 | |
48 | }; | |
49 | ||
50 | static int chroma_tc(HEVCContext *s, int qp_y, int c_idx, int tc_offset) | |
51 | { | |
52 | static const int qp_c[] = { | |
53 | 29, 30, 31, 32, 33, 33, 34, 34, 35, 35, 36, 36, 37, 37 | |
54 | }; | |
55 | int qp, qp_i, offset, idxt; | |
56 | ||
57 | // slice qp offset is not used for deblocking | |
58 | if (c_idx == 1) | |
59 | offset = s->pps->cb_qp_offset; | |
60 | else | |
61 | offset = s->pps->cr_qp_offset; | |
62 | ||
63 | qp_i = av_clip(qp_y + offset, 0, 57); | |
64 | if (s->sps->chroma_format_idc == 1) { | |
65 | if (qp_i < 30) | |
66 | qp = qp_i; | |
67 | else if (qp_i > 43) | |
68 | qp = qp_i - 6; | |
69 | else | |
70 | qp = qp_c[qp_i - 30]; | |
71 | } else { | |
72 | qp = av_clip(qp_i, 0, 51); | |
73 | } | |
74 | ||
75 | idxt = av_clip(qp + DEFAULT_INTRA_TC_OFFSET + tc_offset, 0, 53); | |
76 | return tctable[idxt]; | |
77 | } | |
78 | ||
79 | static int get_qPy_pred(HEVCContext *s, int xBase, int yBase, int log2_cb_size) | |
80 | { | |
81 | HEVCLocalContext *lc = s->HEVClc; | |
82 | int ctb_size_mask = (1 << s->sps->log2_ctb_size) - 1; | |
83 | int MinCuQpDeltaSizeMask = (1 << (s->sps->log2_ctb_size - | |
84 | s->pps->diff_cu_qp_delta_depth)) - 1; | |
85 | int xQgBase = xBase - (xBase & MinCuQpDeltaSizeMask); | |
86 | int yQgBase = yBase - (yBase & MinCuQpDeltaSizeMask); | |
87 | int min_cb_width = s->sps->min_cb_width; | |
88 | int x_cb = xQgBase >> s->sps->log2_min_cb_size; | |
89 | int y_cb = yQgBase >> s->sps->log2_min_cb_size; | |
90 | int availableA = (xBase & ctb_size_mask) && | |
91 | (xQgBase & ctb_size_mask); | |
92 | int availableB = (yBase & ctb_size_mask) && | |
93 | (yQgBase & ctb_size_mask); | |
94 | int qPy_pred, qPy_a, qPy_b; | |
95 | ||
96 | // qPy_pred | |
97 | if (lc->first_qp_group || (!xQgBase && !yQgBase)) { | |
98 | lc->first_qp_group = !lc->tu.is_cu_qp_delta_coded; | |
99 | qPy_pred = s->sh.slice_qp; | |
100 | } else { | |
101 | qPy_pred = lc->qPy_pred; | |
102 | } | |
103 | ||
104 | // qPy_a | |
105 | if (availableA == 0) | |
106 | qPy_a = qPy_pred; | |
107 | else | |
108 | qPy_a = s->qp_y_tab[(x_cb - 1) + y_cb * min_cb_width]; | |
109 | ||
110 | // qPy_b | |
111 | if (availableB == 0) | |
112 | qPy_b = qPy_pred; | |
113 | else | |
114 | qPy_b = s->qp_y_tab[x_cb + (y_cb - 1) * min_cb_width]; | |
115 | ||
116 | av_assert2(qPy_a >= -s->sps->qp_bd_offset && qPy_a < 52); | |
117 | av_assert2(qPy_b >= -s->sps->qp_bd_offset && qPy_b < 52); | |
118 | ||
119 | return (qPy_a + qPy_b + 1) >> 1; | |
120 | } | |
121 | ||
122 | void ff_hevc_set_qPy(HEVCContext *s, int xBase, int yBase, int log2_cb_size) | |
123 | { | |
124 | int qp_y = get_qPy_pred(s, xBase, yBase, log2_cb_size); | |
125 | ||
126 | if (s->HEVClc->tu.cu_qp_delta != 0) { | |
127 | int off = s->sps->qp_bd_offset; | |
128 | s->HEVClc->qp_y = FFUMOD(qp_y + s->HEVClc->tu.cu_qp_delta + 52 + 2 * off, | |
129 | 52 + off) - off; | |
130 | } else | |
131 | s->HEVClc->qp_y = qp_y; | |
132 | } | |
133 | ||
134 | static int get_qPy(HEVCContext *s, int xC, int yC) | |
135 | { | |
136 | int log2_min_cb_size = s->sps->log2_min_cb_size; | |
137 | int x = xC >> log2_min_cb_size; | |
138 | int y = yC >> log2_min_cb_size; | |
139 | return s->qp_y_tab[x + y * s->sps->min_cb_width]; | |
140 | } | |
141 | ||
142 | static void copy_CTB(uint8_t *dst, uint8_t *src, | |
143 | int width, int height, int stride_dst, int stride_src) | |
144 | { | |
145 | int i; | |
146 | ||
147 | for (i = 0; i < height; i++) { | |
148 | memcpy(dst, src, width); | |
149 | dst += stride_dst; | |
150 | src += stride_src; | |
151 | } | |
152 | } | |
153 | ||
154 | static void restore_tqb_pixels(HEVCContext *s, int x0, int y0, int width, int height, int c_idx) | |
155 | { | |
156 | if ( s->pps->transquant_bypass_enable_flag || | |
157 | (s->sps->pcm.loop_filter_disable_flag && s->sps->pcm_enabled_flag)) { | |
158 | int x, y; | |
159 | ptrdiff_t stride_dst = s->sao_frame->linesize[c_idx]; | |
160 | ptrdiff_t stride_src = s->frame->linesize[c_idx]; | |
161 | int min_pu_size = 1 << s->sps->log2_min_pu_size; | |
162 | int hshift = s->sps->hshift[c_idx]; | |
163 | int vshift = s->sps->vshift[c_idx]; | |
164 | int x_min = ((x0 ) >> s->sps->log2_min_pu_size); | |
165 | int y_min = ((y0 ) >> s->sps->log2_min_pu_size); | |
166 | int x_max = ((x0 + width ) >> s->sps->log2_min_pu_size); | |
167 | int y_max = ((y0 + height) >> s->sps->log2_min_pu_size); | |
168 | int len = min_pu_size >> hshift; | |
169 | for (y = y_min; y < y_max; y++) { | |
170 | for (x = x_min; x < x_max; x++) { | |
171 | if (s->is_pcm[y * s->sps->min_pu_width + x]) { | |
172 | int n; | |
173 | uint8_t *src = &s->frame->data[c_idx][ ((y << s->sps->log2_min_pu_size) >> vshift) * stride_src + (((x << s->sps->log2_min_pu_size) >> hshift) << s->sps->pixel_shift)]; | |
174 | uint8_t *dst = &s->sao_frame->data[c_idx][((y << s->sps->log2_min_pu_size) >> vshift) * stride_dst + (((x << s->sps->log2_min_pu_size) >> hshift) << s->sps->pixel_shift)]; | |
175 | for (n = 0; n < (min_pu_size >> vshift); n++) { | |
176 | memcpy(src, dst, len); | |
177 | src += stride_src; | |
178 | dst += stride_dst; | |
179 | } | |
180 | } | |
181 | } | |
182 | } | |
183 | } | |
184 | } | |
185 | ||
186 | #define CTB(tab, x, y) ((tab)[(y) * s->sps->ctb_width + (x)]) | |
187 | ||
188 | static void sao_filter_CTB(HEVCContext *s, int x, int y) | |
189 | { | |
190 | int c_idx; | |
191 | int edges[4]; // 0 left 1 top 2 right 3 bottom | |
192 | int x_ctb = x >> s->sps->log2_ctb_size; | |
193 | int y_ctb = y >> s->sps->log2_ctb_size; | |
194 | int ctb_addr_rs = y_ctb * s->sps->ctb_width + x_ctb; | |
195 | int ctb_addr_ts = s->pps->ctb_addr_rs_to_ts[ctb_addr_rs]; | |
196 | SAOParams *sao = &CTB(s->sao, x_ctb, y_ctb); | |
197 | // flags indicating unfilterable edges | |
198 | uint8_t vert_edge[] = { 0, 0 }; | |
199 | uint8_t horiz_edge[] = { 0, 0 }; | |
200 | uint8_t diag_edge[] = { 0, 0, 0, 0 }; | |
201 | uint8_t lfase = CTB(s->filter_slice_edges, x_ctb, y_ctb); | |
202 | uint8_t no_tile_filter = s->pps->tiles_enabled_flag && | |
203 | !s->pps->loop_filter_across_tiles_enabled_flag; | |
204 | uint8_t restore = no_tile_filter || !lfase; | |
205 | uint8_t left_tile_edge = 0; | |
206 | uint8_t right_tile_edge = 0; | |
207 | uint8_t up_tile_edge = 0; | |
208 | uint8_t bottom_tile_edge = 0; | |
209 | ||
210 | edges[0] = x_ctb == 0; | |
211 | edges[1] = y_ctb == 0; | |
212 | edges[2] = x_ctb == s->sps->ctb_width - 1; | |
213 | edges[3] = y_ctb == s->sps->ctb_height - 1; | |
214 | ||
215 | if (restore) { | |
216 | if (!edges[0]) { | |
217 | left_tile_edge = no_tile_filter && s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[s->pps->ctb_addr_rs_to_ts[ctb_addr_rs-1]]; | |
218 | vert_edge[0] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb - 1, y_ctb)) || left_tile_edge; | |
219 | } | |
220 | if (!edges[2]) { | |
221 | right_tile_edge = no_tile_filter && s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[s->pps->ctb_addr_rs_to_ts[ctb_addr_rs+1]]; | |
222 | vert_edge[1] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb + 1, y_ctb)) || right_tile_edge; | |
223 | } | |
224 | if (!edges[1]) { | |
225 | up_tile_edge = no_tile_filter && s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[s->pps->ctb_addr_rs_to_ts[ctb_addr_rs - s->sps->ctb_width]]; | |
226 | horiz_edge[0] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb, y_ctb - 1)) || up_tile_edge; | |
227 | } | |
228 | if (!edges[3]) { | |
229 | bottom_tile_edge = no_tile_filter && s->pps->tile_id[ctb_addr_ts] != s->pps->tile_id[s->pps->ctb_addr_rs_to_ts[ctb_addr_rs + s->sps->ctb_width]]; | |
230 | horiz_edge[1] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb, y_ctb + 1)) || bottom_tile_edge; | |
231 | } | |
232 | if (!edges[0] && !edges[1]) { | |
233 | diag_edge[0] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb - 1, y_ctb - 1)) || left_tile_edge || up_tile_edge; | |
234 | } | |
235 | if (!edges[1] && !edges[2]) { | |
236 | diag_edge[1] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb + 1, y_ctb - 1)) || right_tile_edge || up_tile_edge; | |
237 | } | |
238 | if (!edges[2] && !edges[3]) { | |
239 | diag_edge[2] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb + 1, y_ctb + 1)) || right_tile_edge || bottom_tile_edge; | |
240 | } | |
241 | if (!edges[0] && !edges[3]) { | |
242 | diag_edge[3] = (!lfase && CTB(s->tab_slice_address, x_ctb, y_ctb) != CTB(s->tab_slice_address, x_ctb - 1, y_ctb + 1)) || left_tile_edge || bottom_tile_edge; | |
243 | } | |
244 | } | |
245 | ||
246 | for (c_idx = 0; c_idx < 3; c_idx++) { | |
247 | int x0 = x >> s->sps->hshift[c_idx]; | |
248 | int y0 = y >> s->sps->vshift[c_idx]; | |
249 | int stride_src = s->frame->linesize[c_idx]; | |
250 | int stride_dst = s->sao_frame->linesize[c_idx]; | |
251 | int ctb_size_h = (1 << (s->sps->log2_ctb_size)) >> s->sps->hshift[c_idx]; | |
252 | int ctb_size_v = (1 << (s->sps->log2_ctb_size)) >> s->sps->vshift[c_idx]; | |
253 | int width = FFMIN(ctb_size_h, (s->sps->width >> s->sps->hshift[c_idx]) - x0); | |
254 | int height = FFMIN(ctb_size_v, (s->sps->height >> s->sps->vshift[c_idx]) - y0); | |
255 | uint8_t *src = &s->frame->data[c_idx][y0 * stride_src + (x0 << s->sps->pixel_shift)]; | |
256 | uint8_t *dst = &s->sao_frame->data[c_idx][y0 * stride_dst + (x0 << s->sps->pixel_shift)]; | |
257 | ||
258 | switch (sao->type_idx[c_idx]) { | |
259 | case SAO_BAND: | |
260 | copy_CTB(dst, src, width << s->sps->pixel_shift, height, stride_dst, stride_src); | |
261 | s->hevcdsp.sao_band_filter(src, dst, | |
262 | stride_src, stride_dst, | |
263 | sao, | |
264 | edges, width, | |
265 | height, c_idx); | |
266 | restore_tqb_pixels(s, x, y, width, height, c_idx); | |
267 | sao->type_idx[c_idx] = SAO_APPLIED; | |
268 | break; | |
269 | case SAO_EDGE: | |
270 | { | |
271 | uint8_t left_pixels = !edges[0] && (CTB(s->sao, x_ctb-1, y_ctb).type_idx[c_idx] != SAO_APPLIED); | |
272 | if (!edges[1]) { | |
273 | uint8_t top_left = !edges[0] && (CTB(s->sao, x_ctb-1, y_ctb-1).type_idx[c_idx] != SAO_APPLIED); | |
274 | uint8_t top_right = !edges[2] && (CTB(s->sao, x_ctb+1, y_ctb-1).type_idx[c_idx] != SAO_APPLIED); | |
275 | if (CTB(s->sao, x_ctb , y_ctb-1).type_idx[c_idx] == 0) | |
276 | memcpy( dst - stride_dst - (top_left << s->sps->pixel_shift), | |
277 | src - stride_src - (top_left << s->sps->pixel_shift), | |
278 | (top_left + width + top_right) << s->sps->pixel_shift); | |
279 | else { | |
280 | if (top_left) | |
281 | memcpy( dst - stride_dst - (1 << s->sps->pixel_shift), | |
282 | src - stride_src - (1 << s->sps->pixel_shift), | |
283 | 1 << s->sps->pixel_shift); | |
284 | if(top_right) | |
285 | memcpy( dst - stride_dst + (width << s->sps->pixel_shift), | |
286 | src - stride_src + (width << s->sps->pixel_shift), | |
287 | 1 << s->sps->pixel_shift); | |
288 | } | |
289 | } | |
290 | if (!edges[3]) { // bottom and bottom right | |
291 | uint8_t bottom_left = !edges[0] && (CTB(s->sao, x_ctb-1, y_ctb+1).type_idx[c_idx] != SAO_APPLIED); | |
292 | memcpy( dst + height * stride_dst - (bottom_left << s->sps->pixel_shift), | |
293 | src + height * stride_src - (bottom_left << s->sps->pixel_shift), | |
294 | (width + 1 + bottom_left) << s->sps->pixel_shift); | |
295 | } | |
296 | copy_CTB(dst - (left_pixels << s->sps->pixel_shift), | |
297 | src - (left_pixels << s->sps->pixel_shift), | |
298 | (width + 1 + left_pixels) << s->sps->pixel_shift, height, stride_dst, stride_src); | |
299 | s->hevcdsp.sao_edge_filter[restore](src, dst, | |
300 | stride_src, stride_dst, | |
301 | sao, | |
302 | edges, width, | |
303 | height, c_idx, | |
304 | vert_edge, | |
305 | horiz_edge, | |
306 | diag_edge); | |
307 | restore_tqb_pixels(s, x, y, width, height, c_idx); | |
308 | sao->type_idx[c_idx] = SAO_APPLIED; | |
309 | break; | |
310 | } | |
311 | } | |
312 | } | |
313 | } | |
314 | ||
315 | static int get_pcm(HEVCContext *s, int x, int y) | |
316 | { | |
317 | int log2_min_pu_size = s->sps->log2_min_pu_size; | |
318 | int x_pu, y_pu; | |
319 | ||
320 | if (x < 0 || y < 0) | |
321 | return 2; | |
322 | ||
323 | x_pu = x >> log2_min_pu_size; | |
324 | y_pu = y >> log2_min_pu_size; | |
325 | ||
326 | if (x_pu >= s->sps->min_pu_width || y_pu >= s->sps->min_pu_height) | |
327 | return 2; | |
328 | return s->is_pcm[y_pu * s->sps->min_pu_width + x_pu]; | |
329 | } | |
330 | ||
331 | #define TC_CALC(qp, bs) \ | |
332 | tctable[av_clip((qp) + DEFAULT_INTRA_TC_OFFSET * ((bs) - 1) + \ | |
333 | (tc_offset >> 1 << 1), \ | |
334 | 0, MAX_QP + DEFAULT_INTRA_TC_OFFSET)] | |
335 | ||
336 | static void deblocking_filter_CTB(HEVCContext *s, int x0, int y0) | |
337 | { | |
338 | uint8_t *src; | |
339 | int x, y; | |
340 | int chroma, beta; | |
341 | int32_t c_tc[2], tc[2]; | |
342 | uint8_t no_p[2] = { 0 }; | |
343 | uint8_t no_q[2] = { 0 }; | |
344 | ||
345 | int log2_ctb_size = s->sps->log2_ctb_size; | |
346 | int x_end, x_end2, y_end; | |
347 | int ctb_size = 1 << log2_ctb_size; | |
348 | int ctb = (x0 >> log2_ctb_size) + | |
349 | (y0 >> log2_ctb_size) * s->sps->ctb_width; | |
350 | int cur_tc_offset = s->deblock[ctb].tc_offset; | |
351 | int cur_beta_offset = s->deblock[ctb].beta_offset; | |
352 | int left_tc_offset, left_beta_offset; | |
353 | int tc_offset, beta_offset; | |
354 | int pcmf = (s->sps->pcm_enabled_flag && | |
355 | s->sps->pcm.loop_filter_disable_flag) || | |
356 | s->pps->transquant_bypass_enable_flag; | |
357 | ||
358 | if (x0) { | |
359 | left_tc_offset = s->deblock[ctb - 1].tc_offset; | |
360 | left_beta_offset = s->deblock[ctb - 1].beta_offset; | |
361 | } else { | |
362 | left_tc_offset = 0; | |
363 | left_beta_offset = 0; | |
364 | } | |
365 | ||
366 | x_end = x0 + ctb_size; | |
367 | if (x_end > s->sps->width) | |
368 | x_end = s->sps->width; | |
369 | y_end = y0 + ctb_size; | |
370 | if (y_end > s->sps->height) | |
371 | y_end = s->sps->height; | |
372 | ||
373 | tc_offset = cur_tc_offset; | |
374 | beta_offset = cur_beta_offset; | |
375 | ||
376 | x_end2 = x_end; | |
377 | if (x_end2 != s->sps->width) | |
378 | x_end2 -= 8; | |
379 | for (y = y0; y < y_end; y += 8) { | |
380 | // vertical filtering luma | |
381 | for (x = x0 ? x0 : 8; x < x_end; x += 8) { | |
382 | const int bs0 = s->vertical_bs[(x + y * s->bs_width) >> 2]; | |
383 | const int bs1 = s->vertical_bs[(x + (y + 4) * s->bs_width) >> 2]; | |
384 | if (bs0 || bs1) { | |
385 | const int qp = (get_qPy(s, x - 1, y) + get_qPy(s, x, y) + 1) >> 1; | |
386 | ||
387 | beta = betatable[av_clip(qp + beta_offset, 0, MAX_QP)]; | |
388 | ||
389 | tc[0] = bs0 ? TC_CALC(qp, bs0) : 0; | |
390 | tc[1] = bs1 ? TC_CALC(qp, bs1) : 0; | |
391 | src = &s->frame->data[LUMA][y * s->frame->linesize[LUMA] + (x << s->sps->pixel_shift)]; | |
392 | if (pcmf) { | |
393 | no_p[0] = get_pcm(s, x - 1, y); | |
394 | no_p[1] = get_pcm(s, x - 1, y + 4); | |
395 | no_q[0] = get_pcm(s, x, y); | |
396 | no_q[1] = get_pcm(s, x, y + 4); | |
397 | s->hevcdsp.hevc_v_loop_filter_luma_c(src, | |
398 | s->frame->linesize[LUMA], | |
399 | beta, tc, no_p, no_q); | |
400 | } else | |
401 | s->hevcdsp.hevc_v_loop_filter_luma(src, | |
402 | s->frame->linesize[LUMA], | |
403 | beta, tc, no_p, no_q); | |
404 | } | |
405 | } | |
406 | ||
407 | if(!y) | |
408 | continue; | |
409 | ||
410 | // horizontal filtering luma | |
411 | for (x = x0 ? x0 - 8 : 0; x < x_end2; x += 8) { | |
412 | const int bs0 = s->horizontal_bs[( x + y * s->bs_width) >> 2]; | |
413 | const int bs1 = s->horizontal_bs[((x + 4) + y * s->bs_width) >> 2]; | |
414 | if (bs0 || bs1) { | |
415 | const int qp = (get_qPy(s, x, y - 1) + get_qPy(s, x, y) + 1) >> 1; | |
416 | ||
417 | tc_offset = x >= x0 ? cur_tc_offset : left_tc_offset; | |
418 | beta_offset = x >= x0 ? cur_beta_offset : left_beta_offset; | |
419 | ||
420 | beta = betatable[av_clip(qp + beta_offset, 0, MAX_QP)]; | |
421 | tc[0] = bs0 ? TC_CALC(qp, bs0) : 0; | |
422 | tc[1] = bs1 ? TC_CALC(qp, bs1) : 0; | |
423 | src = &s->frame->data[LUMA][y * s->frame->linesize[LUMA] + (x << s->sps->pixel_shift)]; | |
424 | if (pcmf) { | |
425 | no_p[0] = get_pcm(s, x, y - 1); | |
426 | no_p[1] = get_pcm(s, x + 4, y - 1); | |
427 | no_q[0] = get_pcm(s, x, y); | |
428 | no_q[1] = get_pcm(s, x + 4, y); | |
429 | s->hevcdsp.hevc_h_loop_filter_luma_c(src, | |
430 | s->frame->linesize[LUMA], | |
431 | beta, tc, no_p, no_q); | |
432 | } else | |
433 | s->hevcdsp.hevc_h_loop_filter_luma(src, | |
434 | s->frame->linesize[LUMA], | |
435 | beta, tc, no_p, no_q); | |
436 | } | |
437 | } | |
438 | } | |
439 | ||
440 | for (chroma = 1; chroma <= 2; chroma++) { | |
441 | int h = 1 << s->sps->hshift[chroma]; | |
442 | int v = 1 << s->sps->vshift[chroma]; | |
443 | ||
444 | // vertical filtering chroma | |
445 | for (y = y0; y < y_end; y += (8 * v)) { | |
446 | for (x = x0 ? x0 : 8 * h; x < x_end; x += (8 * h)) { | |
447 | const int bs0 = s->vertical_bs[(x + y * s->bs_width) >> 2]; | |
448 | const int bs1 = s->vertical_bs[(x + (y + (4 * v)) * s->bs_width) >> 2]; | |
449 | ||
450 | if ((bs0 == 2) || (bs1 == 2)) { | |
451 | const int qp0 = (get_qPy(s, x - 1, y) + get_qPy(s, x, y) + 1) >> 1; | |
452 | const int qp1 = (get_qPy(s, x - 1, y + (4 * v)) + get_qPy(s, x, y + (4 * v)) + 1) >> 1; | |
453 | ||
454 | c_tc[0] = (bs0 == 2) ? chroma_tc(s, qp0, chroma, tc_offset) : 0; | |
455 | c_tc[1] = (bs1 == 2) ? chroma_tc(s, qp1, chroma, tc_offset) : 0; | |
456 | src = &s->frame->data[chroma][(y >> s->sps->vshift[chroma]) * s->frame->linesize[chroma] + ((x >> s->sps->hshift[chroma]) << s->sps->pixel_shift)]; | |
457 | if (pcmf) { | |
458 | no_p[0] = get_pcm(s, x - 1, y); | |
459 | no_p[1] = get_pcm(s, x - 1, y + (4 * v)); | |
460 | no_q[0] = get_pcm(s, x, y); | |
461 | no_q[1] = get_pcm(s, x, y + (4 * v)); | |
462 | s->hevcdsp.hevc_v_loop_filter_chroma_c(src, | |
463 | s->frame->linesize[chroma], | |
464 | c_tc, no_p, no_q); | |
465 | } else | |
466 | s->hevcdsp.hevc_v_loop_filter_chroma(src, | |
467 | s->frame->linesize[chroma], | |
468 | c_tc, no_p, no_q); | |
469 | } | |
470 | } | |
471 | ||
472 | if(!y) | |
473 | continue; | |
474 | ||
475 | // horizontal filtering chroma | |
476 | tc_offset = x0 ? left_tc_offset : cur_tc_offset; | |
477 | x_end2 = x_end; | |
478 | if (x_end != s->sps->width) | |
479 | x_end2 = x_end - 8 * h; | |
480 | for (x = x0 ? x0 - 8 * h : 0; x < x_end2; x += (8 * h)) { | |
481 | const int bs0 = s->horizontal_bs[( x + y * s->bs_width) >> 2]; | |
482 | const int bs1 = s->horizontal_bs[((x + 4 * h) + y * s->bs_width) >> 2]; | |
483 | if ((bs0 == 2) || (bs1 == 2)) { | |
484 | const int qp0 = bs0 == 2 ? (get_qPy(s, x, y - 1) + get_qPy(s, x, y) + 1) >> 1 : 0; | |
485 | const int qp1 = bs1 == 2 ? (get_qPy(s, x + (4 * h), y - 1) + get_qPy(s, x + (4 * h), y) + 1) >> 1 : 0; | |
486 | ||
487 | c_tc[0] = bs0 == 2 ? chroma_tc(s, qp0, chroma, tc_offset) : 0; | |
488 | c_tc[1] = bs1 == 2 ? chroma_tc(s, qp1, chroma, cur_tc_offset) : 0; | |
489 | src = &s->frame->data[chroma][(y >> s->sps->vshift[1]) * s->frame->linesize[chroma] + ((x >> s->sps->hshift[1]) << s->sps->pixel_shift)]; | |
490 | if (pcmf) { | |
491 | no_p[0] = get_pcm(s, x, y - 1); | |
492 | no_p[1] = get_pcm(s, x + (4 * h), y - 1); | |
493 | no_q[0] = get_pcm(s, x, y); | |
494 | no_q[1] = get_pcm(s, x + (4 * h), y); | |
495 | s->hevcdsp.hevc_h_loop_filter_chroma_c(src, | |
496 | s->frame->linesize[chroma], | |
497 | c_tc, no_p, no_q); | |
498 | } else | |
499 | s->hevcdsp.hevc_h_loop_filter_chroma(src, | |
500 | s->frame->linesize[chroma], | |
501 | c_tc, no_p, no_q); | |
502 | } | |
503 | } | |
504 | } | |
505 | } | |
506 | } | |
507 | ||
508 | static int boundary_strength(HEVCContext *s, MvField *curr, MvField *neigh, | |
509 | RefPicList *neigh_refPicList) | |
510 | { | |
511 | if (curr->pred_flag == PF_BI && neigh->pred_flag == PF_BI) { | |
512 | // same L0 and L1 | |
513 | if (s->ref->refPicList[0].list[curr->ref_idx[0]] == neigh_refPicList[0].list[neigh->ref_idx[0]] && | |
514 | s->ref->refPicList[0].list[curr->ref_idx[0]] == s->ref->refPicList[1].list[curr->ref_idx[1]] && | |
515 | neigh_refPicList[0].list[neigh->ref_idx[0]] == neigh_refPicList[1].list[neigh->ref_idx[1]]) { | |
516 | if ((FFABS(neigh->mv[0].x - curr->mv[0].x) >= 4 || FFABS(neigh->mv[0].y - curr->mv[0].y) >= 4 || | |
517 | FFABS(neigh->mv[1].x - curr->mv[1].x) >= 4 || FFABS(neigh->mv[1].y - curr->mv[1].y) >= 4) && | |
518 | (FFABS(neigh->mv[1].x - curr->mv[0].x) >= 4 || FFABS(neigh->mv[1].y - curr->mv[0].y) >= 4 || | |
519 | FFABS(neigh->mv[0].x - curr->mv[1].x) >= 4 || FFABS(neigh->mv[0].y - curr->mv[1].y) >= 4)) | |
520 | return 1; | |
521 | else | |
522 | return 0; | |
523 | } else if (neigh_refPicList[0].list[neigh->ref_idx[0]] == s->ref->refPicList[0].list[curr->ref_idx[0]] && | |
524 | neigh_refPicList[1].list[neigh->ref_idx[1]] == s->ref->refPicList[1].list[curr->ref_idx[1]]) { | |
525 | if (FFABS(neigh->mv[0].x - curr->mv[0].x) >= 4 || FFABS(neigh->mv[0].y - curr->mv[0].y) >= 4 || | |
526 | FFABS(neigh->mv[1].x - curr->mv[1].x) >= 4 || FFABS(neigh->mv[1].y - curr->mv[1].y) >= 4) | |
527 | return 1; | |
528 | else | |
529 | return 0; | |
530 | } else if (neigh_refPicList[1].list[neigh->ref_idx[1]] == s->ref->refPicList[0].list[curr->ref_idx[0]] && | |
531 | neigh_refPicList[0].list[neigh->ref_idx[0]] == s->ref->refPicList[1].list[curr->ref_idx[1]]) { | |
532 | if (FFABS(neigh->mv[1].x - curr->mv[0].x) >= 4 || FFABS(neigh->mv[1].y - curr->mv[0].y) >= 4 || | |
533 | FFABS(neigh->mv[0].x - curr->mv[1].x) >= 4 || FFABS(neigh->mv[0].y - curr->mv[1].y) >= 4) | |
534 | return 1; | |
535 | else | |
536 | return 0; | |
537 | } else { | |
538 | return 1; | |
539 | } | |
540 | } else if ((curr->pred_flag != PF_BI) && (neigh->pred_flag != PF_BI)){ // 1 MV | |
541 | Mv A, B; | |
542 | int ref_A, ref_B; | |
543 | ||
544 | if (curr->pred_flag & 1) { | |
545 | A = curr->mv[0]; | |
546 | ref_A = s->ref->refPicList[0].list[curr->ref_idx[0]]; | |
547 | } else { | |
548 | A = curr->mv[1]; | |
549 | ref_A = s->ref->refPicList[1].list[curr->ref_idx[1]]; | |
550 | } | |
551 | ||
552 | if (neigh->pred_flag & 1) { | |
553 | B = neigh->mv[0]; | |
554 | ref_B = neigh_refPicList[0].list[neigh->ref_idx[0]]; | |
555 | } else { | |
556 | B = neigh->mv[1]; | |
557 | ref_B = neigh_refPicList[1].list[neigh->ref_idx[1]]; | |
558 | } | |
559 | ||
560 | if (ref_A == ref_B) { | |
561 | if (FFABS(A.x - B.x) >= 4 || FFABS(A.y - B.y) >= 4) | |
562 | return 1; | |
563 | else | |
564 | return 0; | |
565 | } else | |
566 | return 1; | |
567 | } | |
568 | ||
569 | return 1; | |
570 | } | |
571 | ||
572 | void ff_hevc_deblocking_boundary_strengths(HEVCContext *s, int x0, int y0, | |
573 | int log2_trafo_size) | |
574 | { | |
575 | HEVCLocalContext *lc = s->HEVClc; | |
576 | MvField *tab_mvf = s->ref->tab_mvf; | |
577 | int log2_min_pu_size = s->sps->log2_min_pu_size; | |
578 | int log2_min_tu_size = s->sps->log2_min_tb_size; | |
579 | int min_pu_width = s->sps->min_pu_width; | |
580 | int min_tu_width = s->sps->min_tb_width; | |
581 | int is_intra = tab_mvf[(y0 >> log2_min_pu_size) * min_pu_width + | |
582 | (x0 >> log2_min_pu_size)].pred_flag == PF_INTRA; | |
583 | int boundary_upper, boundary_left; | |
584 | int i, j, bs; | |
585 | ||
586 | boundary_upper = y0 > 0 && !(y0 & 7); | |
587 | if (boundary_upper && | |
588 | ((!s->sh.slice_loop_filter_across_slices_enabled_flag && | |
589 | lc->boundary_flags & BOUNDARY_UPPER_SLICE && | |
590 | (y0 % (1 << s->sps->log2_ctb_size)) == 0) || | |
591 | (!s->pps->loop_filter_across_tiles_enabled_flag && | |
592 | lc->boundary_flags & BOUNDARY_UPPER_TILE && | |
593 | (y0 % (1 << s->sps->log2_ctb_size)) == 0))) | |
594 | boundary_upper = 0; | |
595 | ||
596 | if (boundary_upper) { | |
597 | RefPicList *rpl_top = (lc->boundary_flags & BOUNDARY_UPPER_SLICE) ? | |
598 | ff_hevc_get_ref_list(s, s->ref, x0, y0 - 1) : | |
599 | s->ref->refPicList; | |
600 | int yp_pu = (y0 - 1) >> log2_min_pu_size; | |
601 | int yq_pu = y0 >> log2_min_pu_size; | |
602 | int yp_tu = (y0 - 1) >> log2_min_tu_size; | |
603 | int yq_tu = y0 >> log2_min_tu_size; | |
604 | ||
605 | for (i = 0; i < (1 << log2_trafo_size); i += 4) { | |
606 | int x_pu = (x0 + i) >> log2_min_pu_size; | |
607 | int x_tu = (x0 + i) >> log2_min_tu_size; | |
608 | MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu]; | |
609 | MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu]; | |
610 | uint8_t top_cbf_luma = s->cbf_luma[yp_tu * min_tu_width + x_tu]; | |
611 | uint8_t curr_cbf_luma = s->cbf_luma[yq_tu * min_tu_width + x_tu]; | |
612 | ||
613 | if (curr->pred_flag == PF_INTRA || top->pred_flag == PF_INTRA) | |
614 | bs = 2; | |
615 | else if (curr_cbf_luma || top_cbf_luma) | |
616 | bs = 1; | |
617 | else | |
618 | bs = boundary_strength(s, curr, top, rpl_top); | |
619 | s->horizontal_bs[((x0 + i) + y0 * s->bs_width) >> 2] = bs; | |
620 | } | |
621 | } | |
622 | ||
623 | // bs for vertical TU boundaries | |
624 | boundary_left = x0 > 0 && !(x0 & 7); | |
625 | if (boundary_left && | |
626 | ((!s->sh.slice_loop_filter_across_slices_enabled_flag && | |
627 | lc->boundary_flags & BOUNDARY_LEFT_SLICE && | |
628 | (x0 % (1 << s->sps->log2_ctb_size)) == 0) || | |
629 | (!s->pps->loop_filter_across_tiles_enabled_flag && | |
630 | lc->boundary_flags & BOUNDARY_LEFT_TILE && | |
631 | (x0 % (1 << s->sps->log2_ctb_size)) == 0))) | |
632 | boundary_left = 0; | |
633 | ||
634 | if (boundary_left) { | |
635 | RefPicList *rpl_left = (lc->boundary_flags & BOUNDARY_LEFT_SLICE) ? | |
636 | ff_hevc_get_ref_list(s, s->ref, x0 - 1, y0) : | |
637 | s->ref->refPicList; | |
638 | int xp_pu = (x0 - 1) >> log2_min_pu_size; | |
639 | int xq_pu = x0 >> log2_min_pu_size; | |
640 | int xp_tu = (x0 - 1) >> log2_min_tu_size; | |
641 | int xq_tu = x0 >> log2_min_tu_size; | |
642 | ||
643 | for (i = 0; i < (1 << log2_trafo_size); i += 4) { | |
644 | int y_pu = (y0 + i) >> log2_min_pu_size; | |
645 | int y_tu = (y0 + i) >> log2_min_tu_size; | |
646 | MvField *left = &tab_mvf[y_pu * min_pu_width + xp_pu]; | |
647 | MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu]; | |
648 | uint8_t left_cbf_luma = s->cbf_luma[y_tu * min_tu_width + xp_tu]; | |
649 | uint8_t curr_cbf_luma = s->cbf_luma[y_tu * min_tu_width + xq_tu]; | |
650 | ||
651 | if (curr->pred_flag == PF_INTRA || left->pred_flag == PF_INTRA) | |
652 | bs = 2; | |
653 | else if (curr_cbf_luma || left_cbf_luma) | |
654 | bs = 1; | |
655 | else | |
656 | bs = boundary_strength(s, curr, left, rpl_left); | |
657 | s->vertical_bs[(x0 + (y0 + i) * s->bs_width) >> 2] = bs; | |
658 | } | |
659 | } | |
660 | ||
661 | if (log2_trafo_size > log2_min_pu_size && !is_intra) { | |
662 | RefPicList *rpl = s->ref->refPicList; | |
663 | ||
664 | // bs for TU internal horizontal PU boundaries | |
665 | for (j = 8; j < (1 << log2_trafo_size); j += 8) { | |
666 | int yp_pu = (y0 + j - 1) >> log2_min_pu_size; | |
667 | int yq_pu = (y0 + j) >> log2_min_pu_size; | |
668 | ||
669 | for (i = 0; i < (1 << log2_trafo_size); i += 4) { | |
670 | int x_pu = (x0 + i) >> log2_min_pu_size; | |
671 | MvField *top = &tab_mvf[yp_pu * min_pu_width + x_pu]; | |
672 | MvField *curr = &tab_mvf[yq_pu * min_pu_width + x_pu]; | |
673 | ||
674 | bs = boundary_strength(s, curr, top, rpl); | |
675 | s->horizontal_bs[((x0 + i) + (y0 + j) * s->bs_width) >> 2] = bs; | |
676 | } | |
677 | } | |
678 | ||
679 | // bs for TU internal vertical PU boundaries | |
680 | for (j = 0; j < (1 << log2_trafo_size); j += 4) { | |
681 | int y_pu = (y0 + j) >> log2_min_pu_size; | |
682 | ||
683 | for (i = 8; i < (1 << log2_trafo_size); i += 8) { | |
684 | int xp_pu = (x0 + i - 1) >> log2_min_pu_size; | |
685 | int xq_pu = (x0 + i) >> log2_min_pu_size; | |
686 | MvField *left = &tab_mvf[y_pu * min_pu_width + xp_pu]; | |
687 | MvField *curr = &tab_mvf[y_pu * min_pu_width + xq_pu]; | |
688 | ||
689 | bs = boundary_strength(s, curr, left, rpl); | |
690 | s->vertical_bs[((x0 + i) + (y0 + j) * s->bs_width) >> 2] = bs; | |
691 | } | |
692 | } | |
693 | } | |
694 | } | |
695 | ||
696 | #undef LUMA | |
697 | #undef CB | |
698 | #undef CR | |
699 | ||
700 | void ff_hevc_hls_filter(HEVCContext *s, int x, int y, int ctb_size) | |
701 | { | |
702 | int x_end = x >= s->sps->width - ctb_size; | |
703 | deblocking_filter_CTB(s, x, y); | |
704 | if (s->sps->sao_enabled) { | |
705 | int y_end = y >= s->sps->height - ctb_size; | |
706 | if (y && x) | |
707 | sao_filter_CTB(s, x - ctb_size, y - ctb_size); | |
708 | if (x && y_end) | |
709 | sao_filter_CTB(s, x - ctb_size, y); | |
710 | if (y && x_end) { | |
711 | sao_filter_CTB(s, x, y - ctb_size); | |
712 | if (s->threads_type & FF_THREAD_FRAME ) | |
713 | ff_thread_report_progress(&s->ref->tf, y, 0); | |
714 | } | |
715 | if (x_end && y_end) { | |
716 | sao_filter_CTB(s, x , y); | |
717 | if (s->threads_type & FF_THREAD_FRAME ) | |
718 | ff_thread_report_progress(&s->ref->tf, y + ctb_size, 0); | |
719 | } | |
720 | } else if (s->threads_type & FF_THREAD_FRAME && x_end) | |
721 | ff_thread_report_progress(&s->ref->tf, y + ctb_size - 4, 0); | |
722 | } | |
723 | ||
724 | void ff_hevc_hls_filters(HEVCContext *s, int x_ctb, int y_ctb, int ctb_size) | |
725 | { | |
726 | int x_end = x_ctb >= s->sps->width - ctb_size; | |
727 | int y_end = y_ctb >= s->sps->height - ctb_size; | |
728 | if (y_ctb && x_ctb) | |
729 | ff_hevc_hls_filter(s, x_ctb - ctb_size, y_ctb - ctb_size, ctb_size); | |
730 | if (y_ctb && x_end) | |
731 | ff_hevc_hls_filter(s, x_ctb, y_ctb - ctb_size, ctb_size); | |
732 | if (x_ctb && y_end) | |
733 | ff_hevc_hls_filter(s, x_ctb - ctb_size, y_ctb, ctb_size); | |
734 | } |