3 |
* XVID MPEG-4 VIDEO CODEC |
* XVID MPEG-4 VIDEO CODEC |
4 |
* - 8bit<->16bit transfer - |
* - 8bit<->16bit transfer - |
5 |
* |
* |
6 |
* Copyright(C) 2001-2002 Peter Ross <pross@xvid.org> |
* Copyright(C) 2001-2003 Peter Ross <pross@xvid.org> |
7 |
* |
* |
8 |
* This file is part of XviD, a free MPEG-4 video encoder/decoder |
* This program is free software ; you can redistribute it and/or modify |
9 |
* |
* it under the terms of the GNU General Public License as published by |
|
* XviD is free software; you can redistribute it and/or modify it |
|
|
* under the terms of the GNU General Public License as published by |
|
10 |
* the Free Software Foundation; either version 2 of the License, or |
* the Free Software Foundation; either version 2 of the License, or |
11 |
* (at your option) any later version. |
* (at your option) any later version. |
12 |
* |
* |
19 |
* along with this program; if not, write to the Free Software |
* along with this program; if not, write to the Free Software |
20 |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA |
21 |
* |
* |
|
* Under section 8 of the GNU General Public License, the copyright |
|
|
* holders of XVID explicitly forbid distribution in the following |
|
|
* countries: |
|
|
* |
|
|
* - Japan |
|
|
* - United States of America |
|
|
* |
|
|
* Linking XviD statically or dynamically with other modules is making a |
|
|
* combined work based on XviD. Thus, the terms and conditions of the |
|
|
* GNU General Public License cover the whole combination. |
|
|
* |
|
|
* As a special exception, the copyright holders of XviD give you |
|
|
* permission to link XviD with independent modules that communicate with |
|
|
* XviD solely through the VFW1.1 and DShow interfaces, regardless of the |
|
|
* license terms of these independent modules, and to copy and distribute |
|
|
* the resulting combined work under terms of your choice, provided that |
|
|
* every copy of the combined work is accompanied by a complete copy of |
|
|
* the source code of XviD (the version of XviD used to produce the |
|
|
* combined work), being distributed under the terms of the GNU General |
|
|
* Public License plus this exception. An independent module is a module |
|
|
* which is not derived from or based on XviD. |
|
|
* |
|
|
* Note that people who make modified versions of XviD are not obligated |
|
|
* to grant this special exception for their modified versions; it is |
|
|
* their choice whether to do so. The GNU General Public License gives |
|
|
* permission to release a modified version without this exception; this |
|
|
* exception also makes it possible to release a modified version which |
|
|
* carries forward this exception. |
|
|
* |
|
22 |
* $Id$ |
* $Id$ |
23 |
* |
* |
24 |
****************************************************************************/ |
****************************************************************************/ |
32 |
TRANSFER_16TO8COPY_PTR transfer_16to8copy; |
TRANSFER_16TO8COPY_PTR transfer_16to8copy; |
33 |
|
|
34 |
TRANSFER_8TO16SUB_PTR transfer_8to16sub; |
TRANSFER_8TO16SUB_PTR transfer_8to16sub; |
35 |
|
TRANSFER_8TO16SUBRO_PTR transfer_8to16subro; |
36 |
TRANSFER_8TO16SUB2_PTR transfer_8to16sub2; |
TRANSFER_8TO16SUB2_PTR transfer_8to16sub2; |
37 |
|
TRANSFER_8TO16SUB2RO_PTR transfer_8to16sub2ro; |
38 |
TRANSFER_16TO8ADD_PTR transfer_16to8add; |
TRANSFER_16TO8ADD_PTR transfer_16to8add; |
39 |
|
|
40 |
TRANSFER8X8_COPY_PTR transfer8x8_copy; |
TRANSFER8X8_COPY_PTR transfer8x8_copy; |
41 |
|
|
42 |
|
#define USE_REFERENCE_C |
43 |
|
|
44 |
/***************************************************************************** |
/***************************************************************************** |
45 |
* |
* |
66 |
const uint8_t * const src, |
const uint8_t * const src, |
67 |
uint32_t stride) |
uint32_t stride) |
68 |
{ |
{ |
69 |
uint32_t i, j; |
int i, j; |
|
|
|
70 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
71 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
72 |
dst[j * 8 + i] = (int16_t) src[j * stride + i]; |
dst[j * 8 + i] = (int16_t) src[j * stride + i]; |
88 |
const int16_t * const src, |
const int16_t * const src, |
89 |
uint32_t stride) |
uint32_t stride) |
90 |
{ |
{ |
91 |
uint32_t i, j; |
int i, j; |
92 |
|
|
93 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
94 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
95 |
|
#ifdef USE_REFERENCE_C |
96 |
int16_t pixel = src[j * 8 + i]; |
int16_t pixel = src[j * 8 + i]; |
97 |
|
|
98 |
if (pixel < 0) { |
if (pixel < 0) { |
101 |
pixel = 255; |
pixel = 255; |
102 |
} |
} |
103 |
dst[j * stride + i] = (uint8_t) pixel; |
dst[j * stride + i] = (uint8_t) pixel; |
104 |
|
#else |
105 |
|
const int16_t pixel = src[j * 8 + i]; |
106 |
|
const uint8_t value = (uint8_t)( (pixel&~255) ? (-pixel)>>(8*sizeof(pixel)-1) : pixel ); |
107 |
|
dst[j*stride + i] = value; |
108 |
|
#endif |
109 |
} |
} |
110 |
} |
} |
111 |
} |
} |
130 |
const uint8_t * ref, |
const uint8_t * ref, |
131 |
const uint32_t stride) |
const uint32_t stride) |
132 |
{ |
{ |
133 |
uint32_t i, j; |
int i, j; |
134 |
|
|
135 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
136 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
137 |
uint8_t c = cur[j * stride + i]; |
const uint8_t c = cur[j * stride + i]; |
138 |
uint8_t r = ref[j * stride + i]; |
const uint8_t r = ref[j * stride + i]; |
139 |
|
|
140 |
cur[j * stride + i] = r; |
cur[j * stride + i] = r; |
141 |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
144 |
} |
} |
145 |
|
|
146 |
|
|
147 |
|
void |
148 |
|
transfer_8to16subro_c(int16_t * const dct, |
149 |
|
const uint8_t * const cur, |
150 |
|
const uint8_t * ref, |
151 |
|
const uint32_t stride) |
152 |
|
{ |
153 |
|
int i, j; |
154 |
|
|
155 |
|
for (j = 0; j < 8; j++) { |
156 |
|
for (i = 0; i < 8; i++) { |
157 |
|
const uint8_t c = cur[j * stride + i]; |
158 |
|
const uint8_t r = ref[j * stride + i]; |
159 |
|
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
160 |
|
} |
161 |
|
} |
162 |
|
} |
163 |
|
|
164 |
|
|
165 |
|
|
166 |
/* |
/* |
167 |
* C - the current buffer |
* C - the current buffer |
168 |
* R1 - the 1st reference buffer |
* R1 - the 1st reference buffer |
173 |
* |
* |
174 |
* R1 (8bit) = R1 |
* R1 (8bit) = R1 |
175 |
* R2 (8bit) = R2 |
* R2 (8bit) = R2 |
176 |
* C (8bit) = C |
* R (temp) = min((R1 + R2)/2, 255) |
177 |
* DCT (16bit)= C - min((R1 + R2)/2, 255) |
* DCT (16bit)= C - R |
178 |
|
* C (8bit) = R |
179 |
*/ |
*/ |
180 |
void |
void |
181 |
transfer_8to16sub2_c(int16_t * const dct, |
transfer_8to16sub2_c(int16_t * const dct, |
188 |
|
|
189 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
190 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
191 |
uint8_t c = cur[j * stride + i]; |
const uint8_t c = cur[j * stride + i]; |
192 |
int r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) / 2; |
const uint8_t r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) >> 1; |
193 |
|
cur[j * stride + i] = r; |
194 |
if (r > 255) { |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
|
r = 255; |
|
195 |
} |
} |
196 |
/*cur[j * stride + i] = r; */ |
} |
197 |
|
} |
198 |
|
|
199 |
|
void |
200 |
|
transfer_8to16sub2ro_c(int16_t * const dct, |
201 |
|
const uint8_t * const cur, |
202 |
|
const uint8_t * ref1, |
203 |
|
const uint8_t * ref2, |
204 |
|
const uint32_t stride) |
205 |
|
{ |
206 |
|
uint32_t i, j; |
207 |
|
|
208 |
|
for (j = 0; j < 8; j++) { |
209 |
|
for (i = 0; i < 8; i++) { |
210 |
|
const uint8_t c = cur[j * stride + i]; |
211 |
|
const uint8_t r = (ref1[j * stride + i] + ref2[j * stride + i] + 1) >> 1; |
212 |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
dct[j * 8 + i] = (int16_t) c - (int16_t) r; |
213 |
} |
} |
214 |
} |
} |
229 |
const int16_t * const src, |
const int16_t * const src, |
230 |
uint32_t stride) |
uint32_t stride) |
231 |
{ |
{ |
232 |
uint32_t i, j; |
int i, j; |
233 |
|
|
234 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; j++) { |
235 |
for (i = 0; i < 8; i++) { |
for (i = 0; i < 8; i++) { |
236 |
|
#ifdef USE_REFERENCE_C |
237 |
int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
238 |
|
|
239 |
if (pixel < 0) { |
if (pixel < 0) { |
242 |
pixel = 255; |
pixel = 255; |
243 |
} |
} |
244 |
dst[j * stride + i] = (uint8_t) pixel; |
dst[j * stride + i] = (uint8_t) pixel; |
245 |
|
#else |
246 |
|
const int16_t pixel = (int16_t) dst[j * stride + i] + src[j * 8 + i]; |
247 |
|
const uint8_t value = (uint8_t)( (pixel&~255) ? (-pixel)>>(8*sizeof(pixel)-1) : pixel ); |
248 |
|
dst[j*stride + i] = value; |
249 |
|
#endif |
250 |
|
|
251 |
} |
} |
252 |
} |
} |
253 |
} |
} |
266 |
const uint8_t * const src, |
const uint8_t * const src, |
267 |
const uint32_t stride) |
const uint32_t stride) |
268 |
{ |
{ |
269 |
uint32_t i, j; |
int j, i; |
270 |
|
|
271 |
for (j = 0; j < 8; j++) { |
for (j = 0; j < 8; ++j) { |
272 |
for (i = 0; i < 8; i++) { |
uint8_t *d = dst + j*stride; |
273 |
dst[j * stride + i] = src[j * stride + i]; |
const uint8_t *s = src + j*stride; |
274 |
|
|
275 |
|
for (i = 0; i < 8; ++i) |
276 |
|
{ |
277 |
|
*d++ = *s++; |
278 |
} |
} |
279 |
} |
} |
280 |
} |
} |