1 // Copyright 2011 Google Inc. All Rights Reserved.
2 //
3 // Use of this source code is governed by a BSD-style license
4 // that can be found in the COPYING file in the root of the source
5 // tree. An additional intellectual property rights grant can be found
6 // in the file PATENTS. All contributing project authors may
7 // be found in the AUTHORS file in the root of the source tree.
8 // -----------------------------------------------------------------------------
9 //
10 // Cost tables for level and modes
11 //
12 // Author: Skal (pascal.massimino@gmail.com)
13
14 #include "./cost.h"
15
16 //------------------------------------------------------------------------------
17 // Level cost tables
18
// For each given level, the following table gives the pattern of contexts to
// use for coding it (in [][0]) as well as the bit value to use for each
// context (in [][1]).
//
// The table is indexed by 'level - 1', for level in [1, MAX_VARIABLE_LEVEL].
// Both columns are bit-masks that are consumed from the least significant bit
// upward: when bit k of [][0] is set, probability slot '2 + k' takes part in
// the coding of the level, and bit k of [][1] is the binary symbol coded with
// that slot (see VariableLevelCost() and VP8RecordCoeffs()).
const uint16_t VP8LevelCodes[MAX_VARIABLE_LEVEL][2] = {
  {0x001, 0x000}, {0x007, 0x001}, {0x00f, 0x005},
  {0x00f, 0x00d}, {0x033, 0x003}, {0x033, 0x003}, {0x033, 0x023},
  {0x033, 0x023}, {0x033, 0x023}, {0x033, 0x023}, {0x0d3, 0x013},
  {0x0d3, 0x013}, {0x0d3, 0x013}, {0x0d3, 0x013}, {0x0d3, 0x013},
  {0x0d3, 0x013}, {0x0d3, 0x013}, {0x0d3, 0x013}, {0x0d3, 0x093},
  {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093},
  {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093},
  {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093},
  {0x0d3, 0x093}, {0x0d3, 0x093}, {0x0d3, 0x093}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053},
  {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x053}, {0x153, 0x153}
};
41
VariableLevelCost(int level,const uint8_t probas[NUM_PROBAS])42 static int VariableLevelCost(int level, const uint8_t probas[NUM_PROBAS]) {
43 int pattern = VP8LevelCodes[level - 1][0];
44 int bits = VP8LevelCodes[level - 1][1];
45 int cost = 0;
46 int i;
47 for (i = 2; pattern; ++i) {
48 if (pattern & 1) {
49 cost += VP8BitCost(bits & 1, probas[i]);
50 }
51 bits >>= 1;
52 pattern >>= 1;
53 }
54 return cost;
55 }
56
57 //------------------------------------------------------------------------------
58 // Pre-calc level costs once for all
59
// Rebuilds the cached level-cost tables of 'proba' from its current
// coefficient probabilities (proba->coeffs_).
// Returns immediately when proba->dirty_ is not set; otherwise fills
// proba->level_cost_, points proba->remapped_costs_ at the per-band tables and
// clears the dirty flag.
void VP8CalculateLevelCosts(VP8EncProba* const proba) {
  int type;

  if (proba->dirty_ == 0) return;   // tables are already up to date.

  for (type = 0; type < NUM_TYPES; ++type) {
    int b, c, pos;

    // Step 1: one cost table per (band, context) pair.
    for (b = 0; b < NUM_BANDS; ++b) {
      for (c = 0; c < NUM_CTX; ++c) {
        const uint8_t* const probas = proba->coeffs_[type][b][c];
        uint16_t* const costs = proba->level_cost_[type][b][c];
        // probas[0] only contributes when the context is non-zero.
        const int prefix_cost = (c > 0) ? VP8BitCost(1, probas[0]) : 0;
        const int nonzero_cost = prefix_cost + VP8BitCost(1, probas[1]);
        int level;

        costs[0] = prefix_cost + VP8BitCost(0, probas[1]);
        for (level = 1; level <= MAX_VARIABLE_LEVEL; ++level) {
          costs[level] = nonzero_cost + VariableLevelCost(level, probas);
        }
        // Starting at level 67 and up, the variable part of the cost is
        // actually constant.
      }
    }

    // Step 2: replicate the per-band tables for each of the 16 coefficient
    // positions. We don't need to sentinel.
    for (pos = 0; pos < 16; ++pos) {
      const int band = VP8EncBands[pos];
      for (c = 0; c < NUM_CTX; ++c) {
        proba->remapped_costs_[type][pos][c] =
            proba->level_cost_[type][band][c];
      }
    }
  }
  proba->dirty_ = 0;
}
91
92 //------------------------------------------------------------------------------
93 // Mode cost tables.
94
// These are the fixed probabilities (in the coding trees) turned into bit-cost
// by calling VP8BitCost().
// Four precomputed costs.
// NOTE(review): presumably one entry per chroma (UV) prediction mode -- confirm
// against the callers, which are not part of this file.
const uint16_t VP8FixedCostsUV[4] = { 302, 984, 439, 642 };
// Four precomputed costs.
// NOTE(review): presumably one entry per intra-16x16 prediction mode -- confirm
// against the callers, which are not part of this file.
// note: these values include the fixed VP8BitCost(1, 145) mode selection cost.
const uint16_t VP8FixedCostsI16[4] = { 663, 919, 872, 919 };
// Precomputed costs stored as a NUM_BMODES x NUM_BMODES x NUM_BMODES table
// (the initializer below provides 10 x 10 x 10 values).
// NOTE(review): presumably indexed as [top mode][left mode][coded mode], i.e.
// the cost of an intra-4x4 mode given the modes of its two neighbours --
// confirm against the callers, which are not part of this file.
const uint16_t VP8FixedCostsI4[NUM_BMODES][NUM_BMODES][NUM_BMODES] = {
  { { 40, 1151, 1723, 1874, 2103, 2019, 1628, 1777, 2226, 2137 },
    { 192, 469, 1296, 1308, 1849, 1794, 1781, 1703, 1713, 1522 },
    { 142, 910, 762, 1684, 1849, 1576, 1460, 1305, 1801, 1657 },
    { 559, 641, 1370, 421, 1182, 1569, 1612, 1725, 863, 1007 },
    { 299, 1059, 1256, 1108, 636, 1068, 1581, 1883, 869, 1142 },
    { 277, 1111, 707, 1362, 1089, 672, 1603, 1541, 1545, 1291 },
    { 214, 781, 1609, 1303, 1632, 2229, 726, 1560, 1713, 918 },
    { 152, 1037, 1046, 1759, 1983, 2174, 1358, 742, 1740, 1390 },
    { 512, 1046, 1420, 753, 752, 1297, 1486, 1613, 460, 1207 },
    { 424, 827, 1362, 719, 1462, 1202, 1199, 1476, 1199, 538 } },
  { { 240, 402, 1134, 1491, 1659, 1505, 1517, 1555, 1979, 2099 },
    { 467, 242, 960, 1232, 1714, 1620, 1834, 1570, 1676, 1391 },
    { 500, 455, 463, 1507, 1699, 1282, 1564, 982, 2114, 2114 },
    { 672, 643, 1372, 331, 1589, 1667, 1453, 1938, 996, 876 },
    { 458, 783, 1037, 911, 738, 968, 1165, 1518, 859, 1033 },
    { 504, 815, 504, 1139, 1219, 719, 1506, 1085, 1268, 1268 },
    { 333, 630, 1445, 1239, 1883, 3672, 799, 1548, 1865, 598 },
    { 399, 644, 746, 1342, 1856, 1350, 1493, 613, 1855, 1015 },
    { 622, 749, 1205, 608, 1066, 1408, 1290, 1406, 546, 971 },
    { 500, 753, 1041, 668, 1230, 1617, 1297, 1425, 1383, 523 } },
  { { 394, 553, 523, 1502, 1536, 981, 1608, 1142, 1666, 2181 },
    { 655, 430, 375, 1411, 1861, 1220, 1677, 1135, 1978, 1553 },
    { 690, 640, 245, 1954, 2070, 1194, 1528, 982, 1972, 2232 },
    { 559, 834, 741, 867, 1131, 980, 1225, 852, 1092, 784 },
    { 690, 875, 516, 959, 673, 894, 1056, 1190, 1528, 1126 },
    { 740, 951, 384, 1277, 1177, 492, 1579, 1155, 1846, 1513 },
    { 323, 775, 1062, 1776, 3062, 1274, 813, 1188, 1372, 655 },
    { 488, 971, 484, 1767, 1515, 1775, 1115, 503, 1539, 1461 },
    { 740, 1006, 998, 709, 851, 1230, 1337, 788, 741, 721 },
    { 522, 1073, 573, 1045, 1346, 887, 1046, 1146, 1203, 697 } },
  { { 105, 864, 1442, 1009, 1934, 1840, 1519, 1920, 1673, 1579 },
    { 534, 305, 1193, 683, 1388, 2164, 1802, 1894, 1264, 1170 },
    { 305, 518, 877, 1108, 1426, 3215, 1425, 1064, 1320, 1242 },
    { 683, 732, 1927, 257, 1493, 2048, 1858, 1552, 1055, 947 },
    { 394, 814, 1024, 660, 959, 1556, 1282, 1289, 893, 1047 },
    { 528, 615, 996, 940, 1201, 635, 1094, 2515, 803, 1358 },
    { 347, 614, 1609, 1187, 3133, 1345, 1007, 1339, 1017, 667 },
    { 218, 740, 878, 1605, 3650, 3650, 1345, 758, 1357, 1617 },
    { 672, 750, 1541, 558, 1257, 1599, 1870, 2135, 402, 1087 },
    { 592, 684, 1161, 430, 1092, 1497, 1475, 1489, 1095, 822 } },
  { { 228, 1056, 1059, 1368, 752, 982, 1512, 1518, 987, 1782 },
    { 494, 514, 818, 942, 965, 892, 1610, 1356, 1048, 1363 },
    { 512, 648, 591, 1042, 761, 991, 1196, 1454, 1309, 1463 },
    { 683, 749, 1043, 676, 841, 1396, 1133, 1138, 654, 939 },
    { 622, 1101, 1126, 994, 361, 1077, 1203, 1318, 877, 1219 },
    { 631, 1068, 857, 1650, 651, 477, 1650, 1419, 828, 1170 },
    { 555, 727, 1068, 1335, 3127, 1339, 820, 1331, 1077, 429 },
    { 504, 879, 624, 1398, 889, 889, 1392, 808, 891, 1406 },
    { 683, 1602, 1289, 977, 578, 983, 1280, 1708, 406, 1122 },
    { 399, 865, 1433, 1070, 1072, 764, 968, 1477, 1223, 678 } },
  { { 333, 760, 935, 1638, 1010, 529, 1646, 1410, 1472, 2219 },
    { 512, 494, 750, 1160, 1215, 610, 1870, 1868, 1628, 1169 },
    { 572, 646, 492, 1934, 1208, 603, 1580, 1099, 1398, 1995 },
    { 786, 789, 942, 581, 1018, 951, 1599, 1207, 731, 768 },
    { 690, 1015, 672, 1078, 582, 504, 1693, 1438, 1108, 2897 },
    { 768, 1267, 571, 2005, 1243, 244, 2881, 1380, 1786, 1453 },
    { 452, 899, 1293, 903, 1311, 3100, 465, 1311, 1319, 813 },
    { 394, 927, 942, 1103, 1358, 1104, 946, 593, 1363, 1109 },
    { 559, 1005, 1007, 1016, 658, 1173, 1021, 1164, 623, 1028 },
    { 564, 796, 632, 1005, 1014, 863, 2316, 1268, 938, 764 } },
  { { 266, 606, 1098, 1228, 1497, 1243, 948, 1030, 1734, 1461 },
    { 366, 585, 901, 1060, 1407, 1247, 876, 1134, 1620, 1054 },
    { 452, 565, 542, 1729, 1479, 1479, 1016, 886, 2938, 1150 },
    { 555, 1088, 1533, 950, 1354, 895, 834, 1019, 1021, 496 },
    { 704, 815, 1193, 971, 973, 640, 1217, 2214, 832, 578 },
    { 672, 1245, 579, 871, 875, 774, 872, 1273, 1027, 949 },
    { 296, 1134, 2050, 1784, 1636, 3425, 442, 1550, 2076, 722 },
    { 342, 982, 1259, 1846, 1848, 1848, 622, 568, 1847, 1052 },
    { 555, 1064, 1304, 828, 746, 1343, 1075, 1329, 1078, 494 },
    { 288, 1167, 1285, 1174, 1639, 1639, 833, 2254, 1304, 509 } },
  { { 342, 719, 767, 1866, 1757, 1270, 1246, 550, 1746, 2151 },
    { 483, 653, 694, 1509, 1459, 1410, 1218, 507, 1914, 1266 },
    { 488, 757, 447, 2979, 1813, 1268, 1654, 539, 1849, 2109 },
    { 522, 1097, 1085, 851, 1365, 1111, 851, 901, 961, 605 },
    { 709, 716, 841, 728, 736, 945, 941, 862, 2845, 1057 },
    { 512, 1323, 500, 1336, 1083, 681, 1342, 717, 1604, 1350 },
    { 452, 1155, 1372, 1900, 1501, 3290, 311, 944, 1919, 922 },
    { 403, 1520, 977, 2132, 1733, 3522, 1076, 276, 3335, 1547 },
    { 559, 1374, 1101, 615, 673, 2462, 974, 795, 984, 984 },
    { 547, 1122, 1062, 812, 1410, 951, 1140, 622, 1268, 651 } },
  { { 165, 982, 1235, 938, 1334, 1366, 1659, 1578, 964, 1612 },
    { 592, 422, 925, 847, 1139, 1112, 1387, 2036, 861, 1041 },
    { 403, 837, 732, 770, 941, 1658, 1250, 809, 1407, 1407 },
    { 896, 874, 1071, 381, 1568, 1722, 1437, 2192, 480, 1035 },
    { 640, 1098, 1012, 1032, 684, 1382, 1581, 2106, 416, 865 },
    { 559, 1005, 819, 914, 710, 770, 1418, 920, 838, 1435 },
    { 415, 1258, 1245, 870, 1278, 3067, 770, 1021, 1287, 522 },
    { 406, 990, 601, 1009, 1265, 1265, 1267, 759, 1017, 1277 },
    { 968, 1182, 1329, 788, 1032, 1292, 1705, 1714, 203, 1403 },
    { 732, 877, 1279, 471, 901, 1161, 1545, 1294, 755, 755 } },
  { { 111, 931, 1378, 1185, 1933, 1648, 1148, 1714, 1873, 1307 },
    { 406, 414, 1030, 1023, 1910, 1404, 1313, 1647, 1509, 793 },
    { 342, 640, 575, 1088, 1241, 1349, 1161, 1350, 1756, 1502 },
    { 559, 766, 1185, 357, 1682, 1428, 1329, 1897, 1219, 802 },
    { 473, 909, 1164, 771, 719, 2508, 1427, 1432, 722, 782 },
    { 342, 892, 785, 1145, 1150, 794, 1296, 1550, 973, 1057 },
    { 208, 1036, 1326, 1343, 1606, 3395, 815, 1455, 1618, 712 },
    { 228, 928, 890, 1046, 3499, 1711, 994, 829, 1720, 1318 },
    { 768, 724, 1058, 636, 991, 1075, 1319, 1324, 616, 825 },
    { 305, 1167, 1358, 899, 1587, 1587, 987, 1988, 1332, 501 } }
};
202
203 //------------------------------------------------------------------------------
204 // helper functions for residuals struct VP8Residual.
205
// Prepares 'res' for a residual of type 'coeff_type'.
//   first      - stored in res->first (the index at which coefficient
//                processing starts, see VP8RecordCoeffs()).
//   coeff_type - stored in res->coeff_type and used to select the per-type
//                entries of enc->proba_.
//   enc        - encoder whose probability, statistics and remapped cost
//                tables 'res' will point at.
//   res        - residual to set up.
void VP8InitResidual(int first, int coeff_type,
                     VP8Encoder* const enc, VP8Residual* const res) {
  // Scalar fields.
  res->first = first;
  res->coeff_type = coeff_type;
  // Per-type views into the encoder's tables.
  res->costs = enc->proba_.remapped_costs_[coeff_type];
  res->stats = enc->proba_.stats_[coeff_type];
  res->prob = enc->proba_.coeffs_[coeff_type];
}
214
215 //------------------------------------------------------------------------------
216 // Mode costs
217
// Returns the residual cost of 'levels' for the 4x4 block designated by
// it->i4_ (column = i4_ & 3, row = i4_ >> 2), using coefficient type 3.
// The coding context is the sum of the top and left non-zero flags of that
// block; the flags themselves are not modified.
int VP8GetCostLuma4(VP8EncIterator* const it, const int16_t levels[16]) {
  VP8Residual res;
  const int col = it->i4_ & 3;
  const int row = it->i4_ >> 2;
  int ctx;
  int cost = 0;

  VP8InitResidual(0, 3, it->enc_, &res);
  ctx = it->top_nz_[col] + it->left_nz_[row];
  VP8SetResidualCoeffs(levels, &res);
  cost += VP8GetResidualCost(ctx, &res);
  return cost;
}
231
// Returns the residual cost of the intra-16x16 luma levels held in 'rd':
// one DC residual (coefficient type 1) followed by sixteen AC residuals
// (coefficient type 0, starting at coefficient 1).
// Side effect: it->top_nz_[0..3] and it->left_nz_[0..3] are overwritten with
// the non-zero flag of each AC block as it is visited.
int VP8GetCostLuma16(VP8EncIterator* const it, const VP8ModeScore* const rd) {
  VP8Encoder* const enc = it->enc_;
  VP8Residual res;
  int total = 0;
  int blk;

  VP8IteratorNzToBytes(it);   // re-import the non-zero context

  // DC part: context comes from slot 8 of the top/left flags.
  VP8InitResidual(0, 1, enc, &res);
  VP8SetResidualCoeffs(rd->y_dc_levels, &res);
  total += VP8GetResidualCost(it->top_nz_[8] + it->left_nz_[8], &res);

  // AC part: the sixteen 4x4 blocks, visited row by row.
  VP8InitResidual(1, 0, enc, &res);
  for (blk = 0; blk < 16; ++blk) {
    const int col = blk & 3;
    const int row = blk >> 2;
    const int ctx = it->top_nz_[col] + it->left_nz_[row];
    VP8SetResidualCoeffs(rd->y_ac_levels[blk], &res);
    total += VP8GetResidualCost(ctx, &res);
    // Propagate the non-zero flag to the blocks on the right and below.
    it->left_nz_[row] = (res.last >= 0);
    it->top_nz_[col] = it->left_nz_[row];
  }
  return total;
}
257
// Returns the residual cost of the chroma levels held in rd->uv_levels
// (coefficient type 2): two groups of 2x2 blocks, selected by ch = 0 and
// ch = 2.
// Side effect: it->top_nz_[4..7] and it->left_nz_[4..7] are overwritten with
// the non-zero flag of each block as it is visited.
int VP8GetCostUV(VP8EncIterator* const it, const VP8ModeScore* const rd) {
  VP8Encoder* const enc = it->enc_;
  VP8Residual res;
  int total = 0;
  int ch;

  VP8IteratorNzToBytes(it);   // re-import the non-zero context

  VP8InitResidual(0, 2, enc, &res);
  for (ch = 0; ch <= 2; ch += 2) {
    const int nz_base = 4 + ch;   // first top/left flag slot of this group
    int blk;
    for (blk = 0; blk < 4; ++blk) {   // 2x2 blocks, row by row
      const int top_idx = nz_base + (blk & 1);
      const int left_idx = nz_base + (blk >> 1);
      const int ctx = it->top_nz_[top_idx] + it->left_nz_[left_idx];
      VP8SetResidualCoeffs(rd->uv_levels[ch * 2 + blk], &res);
      total += VP8GetResidualCost(ctx, &res);
      it->left_nz_[left_idx] = (res.last >= 0);
      it->top_nz_[top_idx] = it->left_nz_[left_idx];
    }
  }
  return total;
}
279
280
281 //------------------------------------------------------------------------------
282 // Recording of token probabilities.
283
// Record proba context used.
// Adds one event to the packed counter '*stats' and returns 'bit' unchanged,
// so that a call can be used directly as a condition.
// Layout of '*stats': the upper 16 bits hold the total number of recorded
// events, the lower 16 bits hold the number of events for which 'bit' was 1.
// Both halves are divided by two when the total is about to overflow.
static int Record(int bit, proba_t* const stats) {
  proba_t p = *stats;
  // An overflow is inbound. This is handled at 0xfffe0000u rather than
  // 0xffff0000u so that 'p + 1u' below can never wrap: with the larger
  // threshold, a run of all-ones events reaches 0xffffffff and the rounding
  // increment then resets the whole counter to zero instead of halving it.
  if (p >= 0xfffe0000u) {
    p = ((p + 1u) >> 1) & 0x7fff7fffu;  // -> divide the stats by 2.
  }
  // record bit count (lower 16 bits) and increment total count (upper 16 bits).
  p += 0x00010000u + bit;
  *stats = p;
  return bit;
}
295
296 // We keep the table-free variant around for reference, in case.
297 #define USE_LEVEL_CODE_TABLE
298
299 // Simulate block coding, but only record statistics.
300 // Note: no need to record the fixed probas.
VP8RecordCoeffs(int ctx,const VP8Residual * const res)301 int VP8RecordCoeffs(int ctx, const VP8Residual* const res) {
302 int n = res->first;
303 // should be stats[VP8EncBands[n]], but it's equivalent for n=0 or 1
304 proba_t* s = res->stats[n][ctx];
305 if (res->last < 0) {
306 Record(0, s + 0);
307 return 0;
308 }
309 while (n <= res->last) {
310 int v;
311 Record(1, s + 0); // order of record doesn't matter
312 while ((v = res->coeffs[n++]) == 0) {
313 Record(0, s + 1);
314 s = res->stats[VP8EncBands[n]][0];
315 }
316 Record(1, s + 1);
317 if (!Record(2u < (unsigned int)(v + 1), s + 2)) { // v = -1 or 1
318 s = res->stats[VP8EncBands[n]][1];
319 } else {
320 v = abs(v);
321 #if !defined(USE_LEVEL_CODE_TABLE)
322 if (!Record(v > 4, s + 3)) {
323 if (Record(v != 2, s + 4))
324 Record(v == 4, s + 5);
325 } else if (!Record(v > 10, s + 6)) {
326 Record(v > 6, s + 7);
327 } else if (!Record((v >= 3 + (8 << 2)), s + 8)) {
328 Record((v >= 3 + (8 << 1)), s + 9);
329 } else {
330 Record((v >= 3 + (8 << 3)), s + 10);
331 }
332 #else
333 if (v > MAX_VARIABLE_LEVEL) {
334 v = MAX_VARIABLE_LEVEL;
335 }
336
337 {
338 const int bits = VP8LevelCodes[v - 1][1];
339 int pattern = VP8LevelCodes[v - 1][0];
340 int i;
341 for (i = 0; (pattern >>= 1) != 0; ++i) {
342 const int mask = 2 << i;
343 if (pattern & 1) Record(!!(bits & mask), s + 3 + i);
344 }
345 }
346 #endif
347 s = res->stats[VP8EncBands[n]][2];
348 }
349 }
350 if (n < 16) Record(0, s + 0);
351 return 1;
352 }
353
354 //------------------------------------------------------------------------------
355