increase max glyph and lines limit
[mplayer/glamo.git] / libvo / aclib.c
blobbc9bb2e55c3e1cdb5799f5a86aeac8bd70a19029
1 #include "config.h"
2 #ifdef CONFIG_FASTMEMCPY
/*
 * aclib - advanced C library ;)
 * This file contains functions which improve and extend the standard C library.
 * See aclib_template.c for the implementations; this file only contains the
 * runtime CPU detection and configuration options.
 * Runtime CPU detection by Michael Niedermayer (michaelni@gmx.at) is under GPL.
 */
10 #include <stddef.h>
11 #include <string.h>
12 #include "cpudetect.h"
13 #include "fastmemcpy.h"
14 #undef memcpy
/*
 * Tuning knobs. Nothing in this file reads them after they are defined; they
 * are presumably consumed by aclib_template.c (confirm there).
 */
#define BLOCK_SIZE 4096
#define CONFUSION_FACTOR 0
// Feel free to fine-tune the two values above; it might be possible to get some speedup with them :)

//#define STATISTICS

/* The x86 assembler variants are only built when configured for ARCH_X86. */
#if ARCH_X86
#define CAN_COMPILE_X86_ASM
#endif

// Note: there are MMX, MMX2 and 3DNOW versions; there is no 3DNOW+MMX2 one.
// Plain C versions -- disabled: with the lines below commented out, nothing
// in this file defines COMPILE_C.
//#if !HAVE_MMX || defined (RUNTIME_CPUDETECT)
//#define COMPILE_C
//#endif
#ifdef CAN_COMPILE_X86_ASM

/*
 * Decide which variants of aclib_template.c get compiled.
 * With RUNTIME_CPUDETECT every variant is built; otherwise the HAVE_* values
 * in effect at this point select the single variant to build.
 */
#if (HAVE_MMX && !HAVE_AMD3DNOW && !HAVE_MMX2) || defined (RUNTIME_CPUDETECT)
#define COMPILE_MMX
#endif

#if (HAVE_MMX2 && !HAVE_SSE2) || defined (RUNTIME_CPUDETECT)
#define COMPILE_MMX2
#endif

#if (HAVE_AMD3DNOW && !HAVE_MMX2) || defined (RUNTIME_CPUDETECT)
#define COMPILE_3DNOW
#endif

#if HAVE_SSE2 || defined (RUNTIME_CPUDETECT)
#define COMPILE_SSE
#endif

/*
 * The selection above is now captured in the COMPILE_* macros, so reset every
 * feature macro to 0. Each section below then redefines the full set before
 * including the template. Note that the values set by the last section that
 * is compiled stay in effect for the remainder of this file.
 */
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 0
#define HAVE_MMX2 0
#define HAVE_AMD3DNOW 0
#define HAVE_SSE 0
#define HAVE_SSE2 0

/* Plain C versions: RENAME() appends the _C suffix. */
#ifdef COMPILE_C
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 0
#define HAVE_MMX2 0
#define HAVE_AMD3DNOW 0
#define HAVE_SSE 0
#define HAVE_SSE2 0
#define RENAME(a) a ## _C
#include "aclib_template.c"
#endif

//MMX versions
#ifdef COMPILE_MMX
#undef RENAME
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 1
#define HAVE_MMX2 0
#define HAVE_AMD3DNOW 0
#define HAVE_SSE 0
#define HAVE_SSE2 0
#define RENAME(a) a ## _MMX
#include "aclib_template.c"
#endif

//MMX2 versions
#ifdef COMPILE_MMX2
#undef RENAME
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 1
#define HAVE_MMX2 1
#define HAVE_AMD3DNOW 0
#define HAVE_SSE 0
#define HAVE_SSE2 0
#define RENAME(a) a ## _MMX2
#include "aclib_template.c"
#endif

//3DNOW versions
#ifdef COMPILE_3DNOW
#undef RENAME
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 1
#define HAVE_MMX2 0
#define HAVE_AMD3DNOW 1
#define HAVE_SSE 0
#define HAVE_SSE2 0
#define RENAME(a) a ## _3DNow
#include "aclib_template.c"
#endif

//SSE versions (only used on SSE2 cpus)
#ifdef COMPILE_SSE
#undef RENAME
#undef HAVE_MMX
#undef HAVE_MMX2
#undef HAVE_AMD3DNOW
#undef HAVE_SSE
#undef HAVE_SSE2
#define HAVE_MMX 1
#define HAVE_MMX2 1
#define HAVE_AMD3DNOW 0
#define HAVE_SSE 1
#define HAVE_SSE2 1
#define RENAME(a) a ## _SSE
#include "aclib_template.c"
#endif

#endif // CAN_COMPILE_X86_ASM
#undef fast_memcpy
/*
 * Copy len bytes from `from` to `to` using the fastest available variant.
 *
 * With RUNTIME_CPUDETECT the variant is chosen at run time from gCpuCaps
 * (only when the x86 assembler variants can be compiled); otherwise it is
 * chosen at compile time from the HAVE_* macros in effect at this point of
 * the file. If no accelerated variant applies, the standard memcpy() is used.
 *
 * The return value of the selected variant is ignored.
 *
 * Returns: `to`.
 */
void *fast_memcpy(void *to, const void *from, size_t len)
{
#ifdef RUNTIME_CPUDETECT
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if (gCpuCaps.hasSSE2)
		fast_memcpy_SSE(to, from, len);
	else if (gCpuCaps.hasMMX2)
		fast_memcpy_MMX2(to, from, len);
	else if (gCpuCaps.has3DNow)
		fast_memcpy_3DNow(to, from, len);
	else if (gCpuCaps.hasMMX)
		fast_memcpy_MMX(to, from, len);
	else
#endif //CAN_COMPILE_X86_ASM
		/* Also the body of the trailing `else` above when that chain is compiled in. */
		memcpy(to, from, len); // prior to MMX we use the standard memcpy
#else
#if HAVE_SSE2
	fast_memcpy_SSE(to, from, len);
#elif HAVE_MMX2
	fast_memcpy_MMX2(to, from, len);
#elif HAVE_AMD3DNOW
	fast_memcpy_3DNow(to, from, len);
#elif HAVE_MMX
	fast_memcpy_MMX(to, from, len);
#else
	memcpy(to, from, len); // prior to MMX we use the standard memcpy
#endif

#endif //!RUNTIME_CPUDETECT
	return to;
}
#undef mem2agpcpy
/*
 * Copy len bytes from `from` to `to` using the fastest available
 * mem2agpcpy variant.
 * NOTE(review): the name suggests a system-memory-to-AGP copy; the actual
 * variant behaviour lives in aclib_template.c -- confirm there.
 *
 * With RUNTIME_CPUDETECT the variant is chosen at run time from gCpuCaps
 * (only when the x86 assembler variants can be compiled); otherwise it is
 * chosen at compile time from the HAVE_* macros in effect at this point of
 * the file. If no accelerated variant applies, the standard memcpy() is used.
 *
 * The return value of the selected variant is ignored.
 *
 * Returns: `to`.
 */
void *mem2agpcpy(void *to, const void *from, size_t len)
{
#ifdef RUNTIME_CPUDETECT
#ifdef CAN_COMPILE_X86_ASM
	// ordered by speed, fastest first
	if (gCpuCaps.hasSSE2)
		mem2agpcpy_SSE(to, from, len);
	else if (gCpuCaps.hasMMX2)
		mem2agpcpy_MMX2(to, from, len);
	else if (gCpuCaps.has3DNow)
		mem2agpcpy_3DNow(to, from, len);
	else if (gCpuCaps.hasMMX)
		mem2agpcpy_MMX(to, from, len);
	else
#endif //CAN_COMPILE_X86_ASM
		/* Also the body of the trailing `else` above when that chain is compiled in. */
		memcpy(to, from, len); // prior to MMX we use the standard memcpy
#else
#if HAVE_SSE2
	mem2agpcpy_SSE(to, from, len);
#elif HAVE_MMX2
	mem2agpcpy_MMX2(to, from, len);
#elif HAVE_AMD3DNOW
	mem2agpcpy_3DNow(to, from, len);
#elif HAVE_MMX
	mem2agpcpy_MMX(to, from, len);
#else
	memcpy(to, from, len); // prior to MMX we use the standard memcpy
#endif

#endif //!RUNTIME_CPUDETECT
	return to;
}
214 #endif /* CONFIG_FASTMEMCPY */