1 /*
2  * Copyright (c) 2017, Alliance for Open Media. All rights reserved
3  *
4  * This source code is subject to the terms of the BSD 2 Clause License and
5  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6  * was not distributed with this source code in the LICENSE file, you can
7  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8  * Media Patent License 1.0 was not distributed with this source code in the
9  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10  */
11 
12 #include "av1/decoder/decodetxb.h"
13 
14 #include "aom_ports/mem.h"
15 #include "av1/common/idct.h"
16 #include "av1/common/scan.h"
17 #include "av1/common/txb_common.h"
18 #include "av1/decoder/decodemv.h"
19 
// Last argument handed to every aom_read_bit() / aom_read_symbol() call in
// this file. It expands to __func__, i.e. the name of the function that
// performs the read.
// NOTE(review): presumably consumed as a label by the bit reader's accounting
// support -- confirm against the aom_reader implementation.
#define ACCT_STR __func__
21 
// Reads one variable-length value from the bit reader.
//
// The code first consumes a prefix: bits are read until a 1 bit is seen, and
// the number of bits read (including that 1) is the prefix length. It then
// reads (prefix length - 1) more bits, most significant first, below an
// implicit leading 1, and returns the resulting number minus one.
//
// xd: supplies error_info for error reporting.
// r:  bit reader to consume from.
//
// A prefix longer than 20 bits is reported via aom_internal_error() with
// AOM_CODEC_CORRUPT_FRAME. Should that call return, the prefix scan stops and
// the suffix is still read using the length reached so far.
static int read_golomb(MACROBLOCKD *xd, aom_reader *r) {
  int prefix_len = 0;

  for (;;) {
    const int stop_bit = aom_read_bit(r, ACCT_STR);
    ++prefix_len;
    // The length limit is tested before the stop bit, so a terminating 1 bit
    // in position 21 is still treated as an error.
    if (prefix_len > 20) {
      aom_internal_error(xd->error_info, AOM_CODEC_CORRUPT_FRAME,
                         "Invalid length in read_golomb");
      break;
    }
    if (stop_bit) break;
  }

  // Start from the implicit leading 1 and shift in the suffix bits.
  int value = 1;
  for (int remaining = prefix_len - 1; remaining > 0; --remaining) {
    value = (value << 1) + aom_read_bit(r, ACCT_STR);
  }

  return value - 1;
}
44 
rec_eob_pos(const int eob_token,const int extra)45 static INLINE int rec_eob_pos(const int eob_token, const int extra) {
46   int eob = av1_eob_group_start[eob_token];
47   if (eob > 2) {
48     eob += extra;
49   }
50   return eob;
51 }
52 
get_dqv(const int16_t * dequant,int coeff_idx,const qm_val_t * iqmatrix)53 static INLINE int get_dqv(const int16_t *dequant, int coeff_idx,
54                           const qm_val_t *iqmatrix) {
55   int dqv = dequant[!!coeff_idx];
56   if (iqmatrix != NULL)
57     dqv =
58         ((iqmatrix[coeff_idx] * dqv) + (1 << (AOM_QM_BITS - 1))) >> AOM_QM_BITS;
59   return dqv;
60 }
61 
read_coeffs_reverse_2d(aom_reader * r,TX_SIZE tx_size,int start_si,int end_si,const int16_t * scan,int bwl,uint8_t * levels,base_cdf_arr base_cdf,br_cdf_arr br_cdf)62 static INLINE void read_coeffs_reverse_2d(aom_reader *r, TX_SIZE tx_size,
63                                           int start_si, int end_si,
64                                           const int16_t *scan, int bwl,
65                                           uint8_t *levels,
66                                           base_cdf_arr base_cdf,
67                                           br_cdf_arr br_cdf) {
68   for (int c = end_si; c >= start_si; --c) {
69     const int pos = scan[c];
70     const int coeff_ctx = get_lower_levels_ctx_2d(levels, pos, bwl, tx_size);
71     const int nsymbs = 4;
72     int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR);
73     if (level > NUM_BASE_LEVELS) {
74       const int br_ctx = get_br_ctx_2d(levels, pos, bwl);
75       aom_cdf_prob *cdf = br_cdf[br_ctx];
76       for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
77         const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR);
78         level += k;
79         if (k < BR_CDF_SIZE - 1) break;
80       }
81     }
82     levels[get_padded_idx(pos, bwl)] = level;
83   }
84 }
85 
read_coeffs_reverse(aom_reader * r,TX_SIZE tx_size,TX_CLASS tx_class,int start_si,int end_si,const int16_t * scan,int bwl,uint8_t * levels,base_cdf_arr base_cdf,br_cdf_arr br_cdf)86 static INLINE void read_coeffs_reverse(aom_reader *r, TX_SIZE tx_size,
87                                        TX_CLASS tx_class, int start_si,
88                                        int end_si, const int16_t *scan, int bwl,
89                                        uint8_t *levels, base_cdf_arr base_cdf,
90                                        br_cdf_arr br_cdf) {
91   for (int c = end_si; c >= start_si; --c) {
92     const int pos = scan[c];
93     const int coeff_ctx =
94         get_lower_levels_ctx(levels, pos, bwl, tx_size, tx_class);
95     const int nsymbs = 4;
96     int level = aom_read_symbol(r, base_cdf[coeff_ctx], nsymbs, ACCT_STR);
97     if (level > NUM_BASE_LEVELS) {
98       const int br_ctx = get_br_ctx(levels, pos, bwl, tx_class);
99       aom_cdf_prob *cdf = br_cdf[br_ctx];
100       for (int idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
101         const int k = aom_read_symbol(r, cdf, BR_CDF_SIZE, ACCT_STR);
102         level += k;
103         if (k < BR_CDF_SIZE - 1) break;
104       }
105     }
106     levels[get_padded_idx(pos, bwl)] = level;
107   }
108 }
109 
// Decodes the coefficients of one transform block and writes the dequantized
// values into the plane's dqcoeff buffer.
//
// Steps, in bitstream order:
//   1. Read the all-zero flag. When set, record DCT_DCT in tx_type_map for
//      plane 0 and return 0 with eob == 0.
//   2. For the luma plane, read the transform type via av1_read_tx_type().
//   3. Read the EOB group token (the CDF is chosen by transform size) plus any
//      extra offset bits, and store the resulting eob in eob_data.
//   4. Read the level of the last coefficient (scan index eob - 1), then the
//      remaining levels in reverse scan order.
//   5. In forward scan order, for every non-zero level: read the sign, add a
//      read_golomb() remainder when level >= MAX_BASE_BR_RANGE, dequantize,
//      and store the clamped value at tcoeffs[pos].
//
// cm:       common decoder state (transform-set flag, quantizer parameters).
// dcb:      per-block decoder state; supplies xd, eob_data and dqcoeff storage.
// r:        bit reader.
// blk_row, blk_col: block position used for tx_type_map and tx type lookup.
// plane:    plane index.
// txb_ctx:  contexts for the skip flag and the DC sign.
// tx_size:  transform size.
//
// Returns the cumulative level: the sum of masked levels capped at
// COEFF_CONTEXT_MASK and then passed through set_dc_sign() with the signed DC
// level.
uint8_t av1_read_coeffs_txb(const AV1_COMMON *const cm, DecoderCodingBlock *dcb,
                            aom_reader *const r, const int blk_row,
                            const int blk_col, const int plane,
                            const TXB_CTX *const txb_ctx,
                            const TX_SIZE tx_size) {
  MACROBLOCKD *const xd = &dcb->xd;
  FRAME_CONTEXT *const ec_ctx = xd->tile_ctx;
  // Output coefficients are clamped to [-2^(7 + bd), 2^(7 + bd) - 1].
  const int32_t coeff_max = (1 << (7 + xd->bd)) - 1;
  const int32_t coeff_min = -(1 << (7 + xd->bd));
  const TX_SIZE txs_ctx = get_txsize_entropy_ctx(tx_size);
  const PLANE_TYPE plane_type = get_plane_type(plane);
  MB_MODE_INFO *const mbmi = xd->mi[0];
  struct macroblockd_plane *const pd = &xd->plane[plane];
  const int16_t *const dequant = pd->seg_dequant_QTX[mbmi->segment_id];
  tran_low_t *const tcoeffs = dcb->dqcoeff_block[plane] + dcb->cb_offset[plane];
  const int tx_shift = av1_get_tx_scale(tx_size);
  const int bwl = get_txb_bwl(tx_size);
  const int txb_w = get_txb_wide(tx_size);
  const int txb_h = get_txb_high(tx_size);
  uint8_t levels_buf[TX_PAD_2D];
  uint8_t *const levels = set_levels(levels_buf, txb_w);
  const int all_zero = aom_read_symbol(
      r, ec_ctx->txb_skip_cdf[txs_ctx][txb_ctx->txb_skip_ctx], 2, ACCT_STR);
  eob_info *const eob_data = dcb->eob_data[plane] + dcb->txb_offset[plane];
  eob_data->max_scan_line = 0;
  eob_data->eob = 0;

#if CONFIG_INSPECTION
  if (plane == 0) {
    mbmi->tx_skip[av1_get_txk_type_index(mbmi->bsize, blk_row, blk_col)] =
        all_zero;
  }
#endif

  if (all_zero) {
    eob_data->max_scan_line = 0;
    if (plane == 0) {
      xd->tx_type_map[blk_row * xd->tx_type_map_stride + blk_col] = DCT_DCT;
    }
    return 0;
  }

  // Only the luma plane carries a transmitted transform type.
  if (plane == AOM_PLANE_Y) {
    av1_read_tx_type(cm, xd, blk_row, blk_col, tx_size, r);
  }
  const TX_TYPE tx_type =
      av1_get_tx_type(xd, plane_type, blk_row, blk_col, tx_size,
                      cm->features.reduced_tx_set_used);
  const TX_CLASS tx_class = tx_type_to_class[tx_type];
  const qm_val_t *const iqmatrix =
      av1_get_iqmatrix(&cm->quant_params, xd, plane, tx_size, tx_type);
  const int16_t *const scan = get_scan(tx_size, tx_type)->scan;

  // EOB group token: the CDF and its alphabet size depend on transform size.
  const int eob_multi_ctx = (tx_class != TX_CLASS_2D);
  int eob_sym;
  switch (txsize_log2_minus4[tx_size]) {
    case 0:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf16[plane_type][eob_multi_ctx], 5, ACCT_STR);
      break;
    case 1:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf32[plane_type][eob_multi_ctx], 6, ACCT_STR);
      break;
    case 2:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf64[plane_type][eob_multi_ctx], 7, ACCT_STR);
      break;
    case 3:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf128[plane_type][eob_multi_ctx], 8, ACCT_STR);
      break;
    case 4:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf256[plane_type][eob_multi_ctx], 9, ACCT_STR);
      break;
    case 5:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf512[plane_type][eob_multi_ctx], 10, ACCT_STR);
      break;
    case 6:
    default:
      eob_sym = aom_read_symbol(
          r, ec_ctx->eob_flag_cdf1024[plane_type][eob_multi_ctx], 11, ACCT_STR);
      break;
  }
  const int eob_pt = eob_sym + 1;

  // Extra offset inside the EOB group: the top bit is read as a symbol with
  // its own CDF, the lower bits are read as plain bits, MSB first.
  int eob_extra = 0;
  const int num_extra_bits = av1_eob_offset_bits[eob_pt];
  if (num_extra_bits > 0) {
    const int eob_ctx = eob_pt - 3;
    const int top_bit = aom_read_symbol(
        r, ec_ctx->eob_extra_cdf[txs_ctx][plane_type][eob_ctx], 2, ACCT_STR);
    if (top_bit) {
      eob_extra += 1 << (num_extra_bits - 1);
    }
    for (int bit_pos = num_extra_bits - 2; bit_pos >= 0; --bit_pos) {
      if (aom_read_bit(r, ACCT_STR)) {
        eob_extra += 1 << bit_pos;
      }
    }
  }
  eob_data->eob = rec_eob_pos(eob_pt, eob_extra);
  // Read the stored value back so later uses see exactly what eob_data holds.
  const int eob = eob_data->eob;

  // With a single coefficient only its own level entry is ever written and
  // read, so the buffer is cleared only when there are more.
  if (eob > 1) {
    memset(levels_buf, 0,
           sizeof(*levels_buf) *
               ((txb_w + TX_PAD_HOR) * (txb_h + TX_PAD_VER) + TX_PAD_END));
  }

  br_cdf_arr br_cdf =
      ec_ctx->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][plane_type];

  {
    // Level of the last coefficient (scan index eob - 1). It is read with a
    // 3-symbol alphabet and offset by one.
    // TODO(angiebird): Put this into a function
    const int last_si = eob - 1;
    const int last_pos = scan[last_si];
    const int base_ctx = get_lower_levels_ctx_eob(bwl, txb_h, last_si);
    int last_level =
        aom_read_symbol(
            r, ec_ctx->coeff_base_eob_cdf[txs_ctx][plane_type][base_ctx], 3,
            ACCT_STR) +
        1;
    if (last_level > NUM_BASE_LEVELS) {
      const int range_ctx = get_br_ctx_eob(last_pos, bwl, tx_class);
      aom_cdf_prob *range_cdf = br_cdf[range_ctx];
      for (int used = 0; used < COEFF_BASE_RANGE; used += BR_CDF_SIZE - 1) {
        const int inc = aom_read_symbol(r, range_cdf, BR_CDF_SIZE, ACCT_STR);
        last_level += inc;
        if (inc < BR_CDF_SIZE - 1) break;
      }
    }
    levels[get_padded_idx(last_pos, bwl)] = last_level;
  }

  // Remaining levels, from scan index eob - 2 down to 0.
  if (eob > 1) {
    base_cdf_arr base_cdf = ec_ctx->coeff_base_cdf[txs_ctx][plane_type];
    const int first_si = eob - 2;
    if (tx_class == TX_CLASS_2D) {
      // The 2D reader handles indices >= 1; index 0 goes through the generic
      // reader.
      read_coeffs_reverse_2d(r, tx_size, 1, first_si, scan, bwl, levels,
                             base_cdf, br_cdf);
      read_coeffs_reverse(r, tx_size, tx_class, 0, 0, scan, bwl, levels,
                          base_cdf, br_cdf);
    } else {
      read_coeffs_reverse(r, tx_size, tx_class, 0, first_si, scan, bwl, levels,
                          base_cdf, br_cdf);
    }
  }

  // Signs, Golomb remainders and dequantization, in forward scan order.
  int cul_level = 0;
  int dc_val = 0;
  for (int si = 0; si < eob; ++si) {
    const int pos = scan[si];
    tran_low_t level = levels[get_padded_idx(pos, bwl)];
    if (!level) continue;

    eob_data->max_scan_line = AOMMAX(eob_data->max_scan_line, pos);

    // The DC sign uses a context-dependent CDF; other signs are plain bits.
    uint8_t sign;
    if (si == 0) {
      sign = aom_read_symbol(
          r, ec_ctx->dc_sign_cdf[plane_type][txb_ctx->dc_sign_ctx], 2,
          ACCT_STR);
    } else {
      sign = aom_read_bit(r, ACCT_STR);
    }

    if (level >= MAX_BASE_BR_RANGE) {
      level += read_golomb(xd, r);
    }

    // The signed DC level is captured before the level is masked.
    if (si == 0) dc_val = sign ? -level : level;

    // Bitmasking to clamp level to valid range:
    //   The valid range for 8/10/12 bit video is at most 14/16/18 bit
    level &= 0xfffff;
    cul_level += level;

    // Bitmasking to clamp dq_coeff to valid range:
    //   The valid range for 8/10/12 bit video is at most 17/19/21 bit
    const int64_t scaled = (int64_t)level * get_dqv(dequant, pos, iqmatrix);
    const tran_low_t magnitude = (tran_low_t)(scaled & 0xffffff) >> tx_shift;
    const tran_low_t dq_coeff = sign ? -magnitude : magnitude;
    tcoeffs[pos] = clamp(dq_coeff, coeff_min, coeff_max);
  }

  cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level);

  // DC value
  set_dc_sign(&cul_level, dc_val);

  return cul_level;
}
323 
// Wrapper around av1_read_coeffs_txb() for one transform block.
//
// It builds the TXB_CTX from the plane's above/left entropy contexts, decodes
// the block, and writes the returned cumulative level back through
// av1_set_entropy_contexts(). For inter blocks on plane 0 whose transform is
// as wide or as tall as TX_64X64, the block's transform type is additionally
// written to tx_type_map at every 16x16-unit step inside the transform.
//
// When TXCOEFF_TIMER is enabled, the elapsed time and a block count are
// accumulated on `cm`.
void av1_read_coeffs_txb_facade(const AV1_COMMON *const cm,
                                DecoderCodingBlock *dcb, aom_reader *const r,
                                const int plane, const int row, const int col,
                                const TX_SIZE tx_size) {
#if TXCOEFF_TIMER
  struct aom_usec_timer timer;
  aom_usec_timer_start(&timer);
#endif
  MACROBLOCKD *const xd = &dcb->xd;
  MB_MODE_INFO *const mbmi = xd->mi[0];
  struct macroblockd_plane *const pd = &xd->plane[plane];

  const BLOCK_SIZE bsize = mbmi->bsize;
  assert(bsize < BLOCK_SIZES_ALL);
  const BLOCK_SIZE plane_bsize =
      get_plane_block_size(bsize, pd->subsampling_x, pd->subsampling_y);

  TXB_CTX txb_ctx;
  get_txb_ctx(plane_bsize, tx_size, plane, pd->above_entropy_context + col,
              pd->left_entropy_context + row, &txb_ctx);
  const uint8_t cul_level =
      av1_read_coeffs_txb(cm, dcb, r, row, col, plane, &txb_ctx, tx_size);
  av1_set_entropy_contexts(xd, pd, plane, plane_bsize, tx_size, cul_level, col,
                           row);

  if (is_inter_block(mbmi)) {
    // The av1_read_coeffs_txb() call above is where av1_read_tx_type() is
    // invoked for luma, so the type is looked up only after it.
    const TX_TYPE tx_type =
        av1_get_tx_type(xd, get_plane_type(plane), row, col, tx_size,
                        cm->features.reduced_tx_set_used);
    const int txw = tx_size_wide_unit[tx_size];
    const int txh = tx_size_high_unit[tx_size];
    const int is_64_level = txw == tx_size_wide_unit[TX_64X64] ||
                            txh == tx_size_high_unit[TX_64X64];

    // The 16x16 unit is due to the constraint from tx_64x64 which sets the
    // maximum tx size for chroma as 32x32. Coupled with 4x1 transform block
    // size, the constraint takes effect in 32x16 / 16x32 size too. To solve
    // the intricacy, cover all the 16x16 units inside a 64 level transform.
    if (plane == 0 && is_64_level) {
      const int step = tx_size_wide_unit[TX_16X16];
      const int stride = xd->tx_type_map_stride;
      for (int dy = 0; dy < txh; dy += step) {
        const int row_base = (row + dy) * stride + col;
        for (int dx = 0; dx < txw; dx += step) {
          xd->tx_type_map[row_base + dx] = tx_type;
        }
      }
    }
  }

#if TXCOEFF_TIMER
  aom_usec_timer_mark(&timer);
  const int64_t elapsed = aom_usec_timer_elapsed(&timer);
  cm->txcoeff_timer += elapsed;
  ++cm->txb_count;
#endif
}
382