VO, AO: remove obsolete/problematic VO/AO drivers
[mplayer.git] / libvo / osd.c
blob95d094bb6eadc878fb692323ab560f9b97a291b0
1 /*
2 * generic alpha renderers for all YUV modes and RGB depths
3 * These are "reference implementations", should be optimized later (MMX, etc).
4 * templating code by Michael Niedermayer (michaelni@gmx.at)
6 * This file is part of MPlayer.
8 * MPlayer is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
13 * MPlayer is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License along
19 * with MPlayer; if not, write to the Free Software Foundation, Inc.,
20 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
23 //#define FAST_OSD
24 //#define FAST_OSD_TABLE
26 #include "config.h"
27 #include "osd.h"
28 #include "mp_msg.h"
29 #include <inttypes.h>
30 #include "cpudetect.h"
// 8-byte-aligned 64-bit constants, only defined for x86 builds.
// NOTE(review): nothing in the code visible here references them; presumably
// they are operands for the MMX code in osd_template.c -- confirm there.
32 #if ARCH_X86
// all 64 bits set
33 static const uint64_t bFF __attribute__((aligned(8))) = 0xFFFFFFFFFFFFFFFFULL;
// only the top 16 bits set
34 static const unsigned long long mask24lh __attribute__((aligned(8))) = 0xFFFF000000000000ULL;
// only the low 48 bits set
35 static const unsigned long long mask24hl __attribute__((aligned(8))) = 0x0000FFFFFFFFFFFFULL;
36 #endif
38 //Note: we have C, X86-noMMX, MMX, MMX2 and 3DNOW versions; there is no 3DNOW+MMX2 one
// Step 1: decide which variants of osd_template.c get compiled.
// With CONFIG_RUNTIME_CPUDETECT every variant is built; otherwise the
// conditions below pick a variant from the build-time HAVE_* settings.
39 //Plain C versions
40 #if !HAVE_MMX || CONFIG_RUNTIME_CPUDETECT
41 #define COMPILE_C
42 #endif
44 #if ARCH_X86
// plain MMX only when neither 3DNow nor MMX2 is available at build time
46 #if (HAVE_MMX && !HAVE_AMD3DNOW && !HAVE_MMX2) || CONFIG_RUNTIME_CPUDETECT
47 #define COMPILE_MMX
48 #endif
50 #if HAVE_MMX2 || CONFIG_RUNTIME_CPUDETECT
51 #define COMPILE_MMX2
52 #endif
// MMX2 takes precedence over 3DNow when both are set at build time
54 #if (HAVE_AMD3DNOW && !HAVE_MMX2) || CONFIG_RUNTIME_CPUDETECT
55 #define COMPILE_3DNOW
56 #endif
58 #endif /* ARCH_X86 */
// Step 2: the COMPILE_* flags are fixed now, so the HAVE_* macros are reset
// to 0. Each variant below redefines them before including the template.
// Whatever the last compiled variant leaves behind is what the `#if HAVE_*`
// chains in the non-runtime-detect dispatchers further down evaluate.
60 #undef HAVE_MMX
61 #undef HAVE_MMX2
62 #undef HAVE_AMD3DNOW
63 #define HAVE_MMX 0
64 #define HAVE_MMX2 0
65 #define HAVE_AMD3DNOW 0
// Step 3: include osd_template.c once per selected variant. RENAME() appends
// the variant suffix (_C, _X86, _MMX, _MMX2, _3DNow); presumably the template
// wraps its function names in RENAME() -- the dispatchers below call e.g.
// vo_draw_alpha_yv12_MMX2.
67 #if ! ARCH_X86
// non-x86 targets: only the generic C variant exists
69 #ifdef COMPILE_C
70 #undef HAVE_MMX
71 #undef HAVE_MMX2
72 #undef HAVE_AMD3DNOW
73 #define HAVE_MMX 0
74 #define HAVE_MMX2 0
75 #define HAVE_AMD3DNOW 0
76 #define RENAME(a) a ## _C
77 #include "osd_template.c"
78 #endif
80 #else
82 //X86 noMMX versions
83 #ifdef COMPILE_C
84 #undef RENAME
85 #undef HAVE_MMX
86 #undef HAVE_MMX2
87 #undef HAVE_AMD3DNOW
88 #define HAVE_MMX 0
89 #define HAVE_MMX2 0
90 #define HAVE_AMD3DNOW 0
91 #define RENAME(a) a ## _X86
92 #include "osd_template.c"
93 #endif
95 //MMX versions
96 #ifdef COMPILE_MMX
97 #undef RENAME
98 #undef HAVE_MMX
99 #undef HAVE_MMX2
100 #undef HAVE_AMD3DNOW
101 #define HAVE_MMX 1
102 #define HAVE_MMX2 0
103 #define HAVE_AMD3DNOW 0
104 #define RENAME(a) a ## _MMX
105 #include "osd_template.c"
106 #endif
108 //MMX2 versions
109 #ifdef COMPILE_MMX2
110 #undef RENAME
111 #undef HAVE_MMX
112 #undef HAVE_MMX2
113 #undef HAVE_AMD3DNOW
114 #define HAVE_MMX 1
115 #define HAVE_MMX2 1
116 #define HAVE_AMD3DNOW 0
117 #define RENAME(a) a ## _MMX2
118 #include "osd_template.c"
119 #endif
121 //3DNOW versions
122 #ifdef COMPILE_3DNOW
123 #undef RENAME
124 #undef HAVE_MMX
125 #undef HAVE_MMX2
126 #undef HAVE_AMD3DNOW
127 #define HAVE_MMX 1
128 #define HAVE_MMX2 0
129 #define HAVE_AMD3DNOW 1
130 #define RENAME(a) a ## _3DNow
131 #include "osd_template.c"
132 #endif
134 #endif /* ARCH_X86 */
/**
 * Public entry point for the YV12 alpha renderer.
 *
 * Forwards all arguments unchanged to one of the vo_draw_alpha_yv12_*
 * variants instantiated from osd_template.c. With runtime CPU detection on
 * x86 the variant is chosen from gCpuCaps; in every other configuration it
 * is fixed at compile time.
 */
void vo_draw_alpha_yv12(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
#if CONFIG_RUNTIME_CPUDETECT && ARCH_X86
    /* probe from the fastest variant down to the plain x86 one */
    if(gCpuCaps.hasMMX2){
        vo_draw_alpha_yv12_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.has3DNow){
        vo_draw_alpha_yv12_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.hasMMX){
        vo_draw_alpha_yv12_MMX(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    vo_draw_alpha_yv12_X86(w, h, src, srca, srcstride, dstbase, dststride);
#elif CONFIG_RUNTIME_CPUDETECT
    /* runtime detection requested, but not an x86 target */
    vo_draw_alpha_yv12_C(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX2
    vo_draw_alpha_yv12_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_AMD3DNOW
    vo_draw_alpha_yv12_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX
    vo_draw_alpha_yv12_MMX(w, h, src, srca, srcstride, dstbase, dststride);
#elif ARCH_X86
    vo_draw_alpha_yv12_X86(w, h, src, srca, srcstride, dstbase, dststride);
#else
    vo_draw_alpha_yv12_C(w, h, src, srca, srcstride, dstbase, dststride);
#endif
}
/**
 * Public entry point for the YUY2 alpha renderer.
 *
 * Forwards all arguments unchanged to one of the vo_draw_alpha_yuy2_*
 * variants instantiated from osd_template.c. With runtime CPU detection on
 * x86 the variant is chosen from gCpuCaps; in every other configuration it
 * is fixed at compile time.
 */
void vo_draw_alpha_yuy2(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
#if CONFIG_RUNTIME_CPUDETECT && ARCH_X86
    /* probe from the fastest variant down to the plain x86 one */
    if(gCpuCaps.hasMMX2){
        vo_draw_alpha_yuy2_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.has3DNow){
        vo_draw_alpha_yuy2_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.hasMMX){
        vo_draw_alpha_yuy2_MMX(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    vo_draw_alpha_yuy2_X86(w, h, src, srca, srcstride, dstbase, dststride);
#elif CONFIG_RUNTIME_CPUDETECT
    /* runtime detection requested, but not an x86 target */
    vo_draw_alpha_yuy2_C(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX2
    vo_draw_alpha_yuy2_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_AMD3DNOW
    vo_draw_alpha_yuy2_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX
    vo_draw_alpha_yuy2_MMX(w, h, src, srca, srcstride, dstbase, dststride);
#elif ARCH_X86
    vo_draw_alpha_yuy2_X86(w, h, src, srca, srcstride, dstbase, dststride);
#else
    vo_draw_alpha_yuy2_C(w, h, src, srca, srcstride, dstbase, dststride);
#endif
}
/**
 * Public entry point for the 24 bpp RGB alpha renderer.
 *
 * Forwards all arguments unchanged to one of the vo_draw_alpha_rgb24_*
 * variants instantiated from osd_template.c. With runtime CPU detection on
 * x86 the variant is chosen from gCpuCaps; in every other configuration it
 * is fixed at compile time.
 */
void vo_draw_alpha_rgb24(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
#if CONFIG_RUNTIME_CPUDETECT && ARCH_X86
    /* probe from the fastest variant down to the plain x86 one */
    if(gCpuCaps.hasMMX2){
        vo_draw_alpha_rgb24_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.has3DNow){
        vo_draw_alpha_rgb24_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.hasMMX){
        vo_draw_alpha_rgb24_MMX(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    vo_draw_alpha_rgb24_X86(w, h, src, srca, srcstride, dstbase, dststride);
#elif CONFIG_RUNTIME_CPUDETECT
    /* runtime detection requested, but not an x86 target */
    vo_draw_alpha_rgb24_C(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX2
    vo_draw_alpha_rgb24_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_AMD3DNOW
    vo_draw_alpha_rgb24_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX
    vo_draw_alpha_rgb24_MMX(w, h, src, srca, srcstride, dstbase, dststride);
#elif ARCH_X86
    vo_draw_alpha_rgb24_X86(w, h, src, srca, srcstride, dstbase, dststride);
#else
    vo_draw_alpha_rgb24_C(w, h, src, srca, srcstride, dstbase, dststride);
#endif
}
/**
 * Public entry point for the 32 bpp RGB alpha renderer.
 *
 * Forwards all arguments unchanged to one of the vo_draw_alpha_rgb32_*
 * variants instantiated from osd_template.c. With runtime CPU detection on
 * x86 the variant is chosen from gCpuCaps; in every other configuration it
 * is fixed at compile time.
 */
void vo_draw_alpha_rgb32(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
#if CONFIG_RUNTIME_CPUDETECT && ARCH_X86
    /* probe from the fastest variant down to the plain x86 one */
    if(gCpuCaps.hasMMX2){
        vo_draw_alpha_rgb32_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.has3DNow){
        vo_draw_alpha_rgb32_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    if(gCpuCaps.hasMMX){
        vo_draw_alpha_rgb32_MMX(w, h, src, srca, srcstride, dstbase, dststride);
        return;
    }
    vo_draw_alpha_rgb32_X86(w, h, src, srca, srcstride, dstbase, dststride);
#elif CONFIG_RUNTIME_CPUDETECT
    /* runtime detection requested, but not an x86 target */
    vo_draw_alpha_rgb32_C(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX2
    vo_draw_alpha_rgb32_MMX2(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_AMD3DNOW
    vo_draw_alpha_rgb32_3DNow(w, h, src, srca, srcstride, dstbase, dststride);
#elif HAVE_MMX
    vo_draw_alpha_rgb32_MMX(w, h, src, srca, srcstride, dstbase, dststride);
#elif ARCH_X86
    vo_draw_alpha_rgb32_X86(w, h, src, srca, srcstride, dstbase, dststride);
#else
    vo_draw_alpha_rgb32_C(w, h, src, srca, srcstride, dstbase, dststride);
#endif
}
256 #ifdef FAST_OSD_TABLE
257 static unsigned short fast_osd_12bpp_table[256];
258 static unsigned short fast_osd_15bpp_table[256];
259 static unsigned short fast_osd_16bpp_table[256];
260 #endif
262 void vo_draw_alpha_init(void){
263 #ifdef FAST_OSD_TABLE
264 int i;
265 for(i=0;i<256;i++){
266 fast_osd_12bpp_table[i]=((i>>4)<< 8)|((i>>4)<<4)|(i>>4);
267 fast_osd_15bpp_table[i]=((i>>3)<<10)|((i>>3)<<5)|(i>>3);
268 fast_osd_16bpp_table[i]=((i>>3)<<11)|((i>>2)<<5)|(i>>3);
270 #endif
271 //FIXME the optimized stuff is a lie for 15/16bpp as they aren't optimized yet
272 if( mp_msg_test(MSGT_OSD,MSGL_V) )
274 #if CONFIG_RUNTIME_CPUDETECT
275 #if ARCH_X86
276 // ordered per speed fasterst first
277 if(gCpuCaps.hasMMX2)
278 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX (with tiny bit MMX2) Optimized OnScreenDisplay\n");
279 else if(gCpuCaps.has3DNow)
280 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX (with tiny bit 3DNow) Optimized OnScreenDisplay\n");
281 else if(gCpuCaps.hasMMX)
282 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX Optimized OnScreenDisplay\n");
283 else
284 mp_msg(MSGT_OSD,MSGL_INFO,"Using X86 Optimized OnScreenDisplay\n");
285 #else
286 mp_msg(MSGT_OSD,MSGL_INFO,"Using Unoptimized OnScreenDisplay\n");
287 #endif
288 #else //CONFIG_RUNTIME_CPUDETECT
289 #if HAVE_MMX2
290 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX (with tiny bit MMX2) Optimized OnScreenDisplay\n");
291 #elif HAVE_AMD3DNOW
292 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX (with tiny bit 3DNow) Optimized OnScreenDisplay\n");
293 #elif HAVE_MMX
294 mp_msg(MSGT_OSD,MSGL_INFO,"Using MMX Optimized OnScreenDisplay\n");
295 #elif ARCH_X86
296 mp_msg(MSGT_OSD,MSGL_INFO,"Using X86 Optimized OnScreenDisplay\n");
297 #else
298 mp_msg(MSGT_OSD,MSGL_INFO,"Using Unoptimized OnScreenDisplay\n");
299 #endif
300 #endif //!CONFIG_RUNTIME_CPUDETECT
/**
 * Alpha-blend an 8-bit gray OSD bitmap onto a 12 bpp surface (three 4-bit
 * channels packed into the low 12 bits of each 16-bit pixel).
 *
 * @param w          width of the area in pixels
 * @param h          height of the area in rows
 * @param src        gray level added to every channel, one byte per pixel
 * @param srca       per-pixel factor: 0 leaves the destination pixel
 *                   untouched, otherwise the old channel is scaled by srca/256
 * @param srcstride  distance in bytes between rows of src and of srca
 * @param dstbase    first destination pixel (accessed as unsigned short)
 * @param dststride  distance in bytes between destination rows
 *
 * Each blended channel saturates at 0x0F. Without the clamp, a sum above 255
 * (scaled destination + src) is wider than 4 bits and spills into the
 * neighbouring channel and the unused top bits of the pixel.
 *
 * With FAST_OSD defined the destination is not blended: covered pixels are
 * simply overwritten with the gray level.
 */
void vo_draw_alpha_rgb12(int w, int h, unsigned char* src, unsigned char *srca,
                         int srcstride, unsigned char* dstbase, int dststride) {
    int y;
    for (y = 0; y < h; y++) {
        unsigned short *dst = (unsigned short*) dstbase;
        int x;
        for (x = 0; x < w; x++) {
            if (srca[x]) {
#ifdef FAST_OSD
#ifdef FAST_OSD_TABLE
                dst[x] = fast_osd_12bpp_table[src[x]];
#else
                register unsigned int a = src[x] >> 4;
                dst[x] = (a << 8) | (a << 4) | a;
#endif
#else
                unsigned int r = dst[x] & 0x0F;
                unsigned int g = (dst[x] >> 4) & 0x0F;
                unsigned int b = (dst[x] >> 8) & 0x0F;
                /* scale the old channel to 8-bit precision, add the gray
                 * level, then reduce back to 4 bits */
                r = (((r * srca[x]) >> 4) + src[x]) >> 4;
                g = (((g * srca[x]) >> 4) + src[x]) >> 4;
                b = (((b * srca[x]) >> 4) + src[x]) >> 4;
                /* saturate so an over-bright sum cannot leak into other bits */
                if (r > 0x0F) r = 0x0F;
                if (g > 0x0F) g = 0x0F;
                if (b > 0x0F) b = 0x0F;
                dst[x] = (b << 8) | (g << 4) | r;
#endif
            }
        }
        src += srcstride;
        srca += srcstride;
        dstbase += dststride;
    }
}
/**
 * Alpha-blend an 8-bit gray OSD bitmap onto a 15 bpp surface (three 5-bit
 * channels packed into the low 15 bits of each 16-bit pixel).
 *
 * @param w          width of the area in pixels
 * @param h          height of the area in rows
 * @param src        gray level added to every channel, one byte per pixel
 * @param srca       per-pixel factor: 0 leaves the destination pixel
 *                   untouched, otherwise the old channel is scaled by srca/256
 * @param srcstride  distance in bytes between rows of src and of srca
 * @param dstbase    first destination pixel (accessed as unsigned short)
 * @param dststride  distance in bytes between destination rows
 *
 * Each blended channel saturates at 0x1F. Without the clamp, a sum above 255
 * (scaled destination + src) is wider than 5 bits and spills into the
 * neighbouring channel and bit 15 of the pixel.
 *
 * With FAST_OSD defined the destination is not blended: covered pixels are
 * simply overwritten with the gray level.
 */
void vo_draw_alpha_rgb15(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
    int y;
    for(y=0;y<h;y++){
        unsigned short *dst = (unsigned short*) dstbase;
        int x;
        for(x=0;x<w;x++){
            if(srca[x]){
#ifdef FAST_OSD
#ifdef FAST_OSD_TABLE
                dst[x]=fast_osd_15bpp_table[src[x]];
#else
                register unsigned int a=src[x]>>3;
                dst[x]=(a<<10)|(a<<5)|a;
#endif
#else
                unsigned int r=dst[x]&0x1F;
                unsigned int g=(dst[x]>>5)&0x1F;
                unsigned int b=(dst[x]>>10)&0x1F;
                /* scale the old channel to 8-bit precision, add the gray
                 * level, then reduce back to 5 bits */
                r=(((r*srca[x])>>5)+src[x])>>3;
                g=(((g*srca[x])>>5)+src[x])>>3;
                b=(((b*srca[x])>>5)+src[x])>>3;
                /* saturate so an over-bright sum cannot leak into other bits */
                if(r>0x1F) r=0x1F;
                if(g>0x1F) g=0x1F;
                if(b>0x1F) b=0x1F;
                dst[x]=(b<<10)|(g<<5)|r;
#endif
            }
        }
        src+=srcstride;
        srca+=srcstride;
        dstbase+=dststride;
    }
}
/**
 * Alpha-blend an 8-bit gray OSD bitmap onto a 16 bpp surface (5-bit low
 * channel, 6-bit middle channel, 5-bit high channel per 16-bit pixel).
 *
 * @param w          width of the area in pixels
 * @param h          height of the area in rows
 * @param src        gray level added to every channel, one byte per pixel
 * @param srca       per-pixel factor: 0 leaves the destination pixel
 *                   untouched, otherwise the old channel is scaled by srca/256
 * @param srcstride  distance in bytes between rows of src and of srca
 * @param dstbase    first destination pixel (accessed as unsigned short)
 * @param dststride  distance in bytes between destination rows
 *
 * Each blended channel saturates at its field maximum (0x1F / 0x3F / 0x1F).
 * Without the clamp, a sum above 255 (scaled destination + src) is wider
 * than the field and corrupts the neighbouring channel.
 *
 * With FAST_OSD defined the destination is not blended: covered pixels are
 * simply overwritten with the gray level.
 */
void vo_draw_alpha_rgb16(int w,int h, unsigned char* src, unsigned char *srca, int srcstride, unsigned char* dstbase,int dststride){
    int y;
    for(y=0;y<h;y++){
        unsigned short *dst = (unsigned short*) dstbase;
        int x;
        for(x=0;x<w;x++){
            if(srca[x]){
#ifdef FAST_OSD
#ifdef FAST_OSD_TABLE
                dst[x]=fast_osd_16bpp_table[src[x]];
#else
                dst[x]=((src[x]>>3)<<11)|((src[x]>>2)<<5)|(src[x]>>3);
#endif
#else
                unsigned int r=dst[x]&0x1F;
                unsigned int g=(dst[x]>>5)&0x3F;
                unsigned int b=(dst[x]>>11)&0x1F;
                /* scale the old channel to 8-bit precision, add the gray
                 * level, then reduce back to the field width */
                r=(((r*srca[x])>>5)+src[x])>>3;
                g=(((g*srca[x])>>6)+src[x])>>2;
                b=(((b*srca[x])>>5)+src[x])>>3;
                /* saturate so an over-bright sum cannot leak into other bits */
                if(r>0x1F) r=0x1F;
                if(g>0x3F) g=0x3F;
                if(b>0x1F) b=0x1F;
                dst[x]=(b<<11)|(g<<5)|r;
#endif
            }
        }
        src+=srcstride;
        srca+=srcstride;
        dstbase+=dststride;
    }
}