1 /*
2  * Copyright © 2018, VideoLAN and dav1d authors
3  * Copyright © 2018, Two Orioles, LLC
4  * All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions are met:
8  *
9  * 1. Redistributions of source code must retain the above copyright notice, this
10  *    list of conditions and the following disclaimer.
11  *
12  * 2. Redistributions in binary form must reproduce the above copyright notice,
13  *    this list of conditions and the following disclaimer in the documentation
14  *    and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
20  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 
28 #ifndef DAV1D_SRC_CDF_H
29 #define DAV1D_SRC_CDF_H
30 
31 #include <stdint.h>
32 
33 #include "src/levels.h"
34 #include "src/ref.h"
35 #include "src/thread_data.h"
36 
37 /* Buffers padded to [8] or [16] for SIMD where needed. */
38 
39 typedef struct CdfModeContext {
40     ALIGN(uint16_t y_mode[4][N_INTRA_PRED_MODES + 3], 32);
41     ALIGN(uint16_t uv_mode[2][N_INTRA_PRED_MODES][N_UV_INTRA_PRED_MODES + 2], 32);
42     ALIGN(uint16_t wedge_idx[9][16], 32);
43     ALIGN(uint16_t partition[N_BL_LEVELS][4][N_PARTITIONS + 6], 32);
44     ALIGN(uint16_t cfl_alpha[6][16], 32);
45     ALIGN(uint16_t txtp_inter1[2][16], 32);
46     ALIGN(uint16_t txtp_inter2[12 + 4], 32);
47     ALIGN(uint16_t txtp_intra1[2][N_INTRA_PRED_MODES][7 + 1], 16);
48     ALIGN(uint16_t txtp_intra2[3][N_INTRA_PRED_MODES][5 + 3], 16);
49     ALIGN(uint16_t cfl_sign[8], 16);
50     ALIGN(uint16_t angle_delta[8][8], 16);
51     ALIGN(uint16_t filter_intra[5 + 3], 16);
52     ALIGN(uint16_t comp_inter_mode[8][N_COMP_INTER_PRED_MODES], 16);
53     ALIGN(uint16_t seg_id[3][DAV1D_MAX_SEGMENTS], 16);
54     ALIGN(uint16_t pal_sz[2][7][7 + 1], 16);
55     ALIGN(uint16_t color_map[2][7][5][8], 16);
56     ALIGN(uint16_t filter[2][8][DAV1D_N_SWITCHABLE_FILTERS + 1], 8);
57     ALIGN(uint16_t txsz[N_TX_SIZES - 1][3][4], 8);
58     ALIGN(uint16_t motion_mode[N_BS_SIZES][3 + 1], 8);
59     ALIGN(uint16_t delta_q[4], 8);
60     ALIGN(uint16_t delta_lf[5][4], 8);
61     ALIGN(uint16_t interintra_mode[4][4], 8);
62     ALIGN(uint16_t restore_switchable[3 + 1], 8);
63     ALIGN(uint16_t restore_wiener[2], 4);
64     ALIGN(uint16_t restore_sgrproj[2], 4);
65     ALIGN(uint16_t interintra[7][2], 4);
66     ALIGN(uint16_t interintra_wedge[7][2], 4);
67     ALIGN(uint16_t txtp_inter3[4][2], 4);
68     ALIGN(uint16_t use_filter_intra[N_BS_SIZES][2], 4);
69     ALIGN(uint16_t newmv_mode[6][2], 4);
70     ALIGN(uint16_t globalmv_mode[2][2], 4);
71     ALIGN(uint16_t refmv_mode[6][2], 4);
72     ALIGN(uint16_t drl_bit[3][2], 4);
73     ALIGN(uint16_t intra[4][2], 4);
74     ALIGN(uint16_t comp[5][2], 4);
75     ALIGN(uint16_t comp_dir[5][2], 4);
76     ALIGN(uint16_t jnt_comp[6][2], 4);
77     ALIGN(uint16_t mask_comp[6][2], 4);
78     ALIGN(uint16_t wedge_comp[9][2], 4);
79     ALIGN(uint16_t ref[6][3][2], 4);
80     ALIGN(uint16_t comp_fwd_ref[3][3][2], 4);
81     ALIGN(uint16_t comp_bwd_ref[2][3][2], 4);
82     ALIGN(uint16_t comp_uni_ref[3][3][2], 4);
83     ALIGN(uint16_t txpart[7][3][2], 4);
84     ALIGN(uint16_t skip[3][2], 4);
85     ALIGN(uint16_t skip_mode[3][2], 4);
86     ALIGN(uint16_t seg_pred[3][2], 4);
87     ALIGN(uint16_t obmc[N_BS_SIZES][2], 4);
88     ALIGN(uint16_t pal_y[7][3][2], 4);
89     ALIGN(uint16_t pal_uv[2][2], 4);
90     ALIGN(uint16_t intrabc[2], 4);
91 } CdfModeContext;
92 
93 typedef struct CdfCoefContext {
94     ALIGN(uint16_t eob_bin_16[2][2][5 + 3], 16);
95     ALIGN(uint16_t eob_bin_32[2][2][6 + 2], 16);
96     ALIGN(uint16_t eob_bin_64[2][2][7 + 1], 16);
97     ALIGN(uint16_t eob_bin_128[2][2][8 + 0], 16);
98     ALIGN(uint16_t eob_bin_256[2][2][9 + 7], 32);
99     ALIGN(uint16_t eob_bin_512[2][10 + 6], 32);
100     ALIGN(uint16_t eob_bin_1024[2][11 + 5], 32);
101     ALIGN(uint16_t eob_base_tok[N_TX_SIZES][2][4][4], 8);
102     ALIGN(uint16_t base_tok[N_TX_SIZES][2][41][4], 8);
103     ALIGN(uint16_t br_tok[4 /*5*/][2][21][4], 8);
104     ALIGN(uint16_t eob_hi_bit[N_TX_SIZES][2][11 /*22*/][2], 4);
105     ALIGN(uint16_t skip[N_TX_SIZES][13][2], 4);
106     ALIGN(uint16_t dc_sign[2][3][2], 4);
107 } CdfCoefContext;
108 
109 typedef struct CdfMvComponent {
110     ALIGN(uint16_t classes[11 + 5], 32);
111     ALIGN(uint16_t class0_fp[2][4], 8);
112     ALIGN(uint16_t classN_fp[4], 8);
113     ALIGN(uint16_t class0_hp[2], 4);
114     ALIGN(uint16_t classN_hp[2], 4);
115     ALIGN(uint16_t class0[2], 4);
116     ALIGN(uint16_t classN[10][2], 4);
117     ALIGN(uint16_t sign[2], 4);
118 } CdfMvComponent;
119 
120 typedef struct CdfMvContext {
121     CdfMvComponent comp[2];
122     ALIGN(uint16_t joint[N_MV_JOINTS], 8);
123 } CdfMvContext;
124 
125 typedef struct CdfContext {
126     CdfModeContext m;
127     ALIGN(uint16_t kfym[5][5][N_INTRA_PRED_MODES + 3], 32);
128     CdfCoefContext coef;
129     CdfMvContext mv, dmv;
130 } CdfContext;
131 
132 typedef struct CdfThreadContext {
133     Dav1dRef *ref; ///< allocation origin
134     union {
135         CdfContext *cdf; // if ref != NULL
136         unsigned qcat; // if ref == NULL, from static CDF tables
137     } data;
138     struct thread_data *t;
139     atomic_uint *progress;
140 } CdfThreadContext;
141 
142 void dav1d_cdf_thread_init_static(CdfThreadContext *cdf, int qidx);
143 int dav1d_cdf_thread_alloc(Dav1dContext *c, CdfThreadContext *cdf,
144                            struct thread_data *t);
145 void dav1d_cdf_thread_copy(CdfContext *dst, const CdfThreadContext *src);
146 void dav1d_cdf_thread_ref(CdfThreadContext *dst, CdfThreadContext *src);
147 void dav1d_cdf_thread_unref(CdfThreadContext *cdf);
148 void dav1d_cdf_thread_update(const Dav1dFrameHeader *hdr, CdfContext *dst,
149                              const CdfContext *src);
150 
151 /*
152  * These are binary signals (so a signal is either "done" or "not done").
153  */
154 void dav1d_cdf_thread_wait(CdfThreadContext *cdf);
155 void dav1d_cdf_thread_signal(CdfThreadContext *cdf);
156 
157 #endif /* DAV1D_SRC_CDF_H */
158