Skip to content
This repository has been archived by the owner on Feb 11, 2021. It is now read-only.

Latest commit

 

History

History
159 lines (141 loc) · 4.36 KB

SDL_blit_copy.c

File metadata and controls

159 lines (141 loc) · 4.36 KB
 
Apr 8, 2011
Apr 8, 2011
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
Simple DirectMedia Layer
Copyright (C) 1997-2011 Sam Lantinga <slouken@libsdl.org>
This software is provided 'as-is', without any express or implied
warranty. In no event will the authors be held liable for any damages
arising from the use of this software.
Permission is granted to anyone to use this software for any purpose,
including commercial applications, and to alter it and redistribute it
freely, subject to the following restrictions:
1. The origin of this software must not be misrepresented; you must not
claim that you wrote the original software. If you use this software
in a product, an acknowledgment in the product documentation would be
appreciated but is not required.
2. Altered source versions must be plainly marked as such, and must not be
misrepresented as being the original software.
3. This notice may not be removed or altered from any source distribution.
20
21
22
23
24
*/
#include "SDL_config.h"
#include "SDL_video.h"
#include "SDL_blit.h"
Aug 16, 2007
Aug 16, 2007
25
#include "SDL_blit_copy.h"
Aug 16, 2007
Aug 16, 2007
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
#ifdef __SSE__
/* This assumes 16-byte aligned src and dst */
static __inline__ void
SDL_memcpySSE(Uint8 * dst, const Uint8 * src, int len)
{
int i;
__m128 values[4];
for (i = len / 64; i--;) {
_mm_prefetch(src, _MM_HINT_NTA);
values[0] = *(__m128 *) (src + 0);
values[1] = *(__m128 *) (src + 16);
values[2] = *(__m128 *) (src + 32);
values[3] = *(__m128 *) (src + 48);
_mm_stream_ps((float *) (dst + 0), values[0]);
_mm_stream_ps((float *) (dst + 16), values[1]);
_mm_stream_ps((float *) (dst + 32), values[2]);
_mm_stream_ps((float *) (dst + 48), values[3]);
src += 64;
dst += 64;
}
if (len & 63)
SDL_memcpy(dst, src, len & 63);
}
#endif /* __SSE__ */
Nov 24, 2008
Nov 24, 2008
56
57
58
#ifdef _MSC_VER
#pragma warning(disable:4799)
#endif
Aug 16, 2007
Aug 16, 2007
59
/* This assumes 8-byte aligned src and dst */
60
static __inline__ void
Aug 16, 2007
Aug 16, 2007
61
SDL_memcpyMMX(Uint8 * dst, const Uint8 * src, int len)
Aug 16, 2007
Aug 16, 2007
65
__m64 values[8];
66
for (i = len / 64; i--;) {
Dec 16, 2009
Dec 16, 2009
67
#ifdef __SSE__
Aug 16, 2007
Aug 16, 2007
68
_mm_prefetch(src, _MM_HINT_NTA);
Dec 16, 2009
Dec 16, 2009
69
#endif
Aug 16, 2007
Aug 16, 2007
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
values[0] = *(__m64 *) (src + 0);
values[1] = *(__m64 *) (src + 8);
values[2] = *(__m64 *) (src + 16);
values[3] = *(__m64 *) (src + 24);
values[4] = *(__m64 *) (src + 32);
values[5] = *(__m64 *) (src + 40);
values[6] = *(__m64 *) (src + 48);
values[7] = *(__m64 *) (src + 56);
_mm_stream_pi((__m64 *) (dst + 0), values[0]);
_mm_stream_pi((__m64 *) (dst + 8), values[1]);
_mm_stream_pi((__m64 *) (dst + 16), values[2]);
_mm_stream_pi((__m64 *) (dst + 24), values[3]);
_mm_stream_pi((__m64 *) (dst + 32), values[4]);
_mm_stream_pi((__m64 *) (dst + 40), values[5]);
_mm_stream_pi((__m64 *) (dst + 48), values[6]);
_mm_stream_pi((__m64 *) (dst + 56), values[7]);
86
87
88
src += 64;
dst += 64;
}
Aug 16, 2007
Aug 16, 2007
89
90
91
92
93
94
95
96
97
if (len & 63)
SDL_memcpy(dst, src, len & 63);
}
#endif /* __MMX__ */
void
SDL_BlitCopy(SDL_BlitInfo * info)
{
Feb 16, 2011
Feb 16, 2011
98
SDL_bool overlap;
99
100
101
102
Uint8 *src, *dst;
int w, h;
int srcskip, dstskip;
Aug 18, 2007
Aug 18, 2007
103
w = info->dst_w * info->dst_fmt->BytesPerPixel;
Aug 17, 2007
Aug 17, 2007
104
105
106
h = info->dst_h;
src = info->src;
dst = info->dst;
Aug 18, 2007
Aug 18, 2007
107
108
srcskip = info->src_pitch;
dstskip = info->dst_pitch;
Feb 16, 2011
Feb 16, 2011
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
/* Properly handle overlapping blits */
if (src < dst) {
overlap = (dst < (src + h*srcskip));
} else {
overlap = (src < (dst + h*dstskip));
}
if (overlap) {
while (h--) {
SDL_memmove(dst, src, w);
src += srcskip;
dst += dstskip;
}
return;
}
Dec 3, 2008
Dec 3, 2008
126
127
128
if (SDL_HasSSE() &&
!((uintptr_t) src & 15) && !(srcskip & 15) &&
!((uintptr_t) dst & 15) && !(dstskip & 15)) {
129
130
131
132
133
134
135
136
137
138
while (h--) {
SDL_memcpySSE(dst, src, w);
src += srcskip;
dst += dstskip;
}
return;
}
#endif
#ifdef __MMX__
Dec 3, 2008
Dec 3, 2008
139
140
141
if (SDL_HasMMX() &&
!((uintptr_t) src & 7) && !(srcskip & 7) &&
!((uintptr_t) dst & 7) && !(dstskip & 7)) {
142
143
144
145
146
while (h--) {
SDL_memcpyMMX(dst, src, w);
src += srcskip;
dst += dstskip;
}
Aug 16, 2007
Aug 16, 2007
147
_mm_empty();
148
149
150
151
152
153
154
155
156
157
158
159
return;
}
#endif
while (h--) {
SDL_memcpy(dst, src, w);
src += srcskip;
dst += dstskip;
}
}
/* vi: set ts=4 sw=4 expandtab: */