20 #include <linux/string.h>
21 #include <linux/module.h>
22 #include <linux/sched.h>
23 #include <linux/types.h>
48 ".section .fixup, \"ax\"\n"
49 "3: movw $0x1AEB, 1b\n"
57 "1: prefetch 320(%0)\n"
58 "2: movq (%0), %%mm0\n"
59 " movq 8(%0), %%mm1\n"
60 " movq 16(%0), %%mm2\n"
61 " movq 24(%0), %%mm3\n"
63 " movq %%mm1, 8(%1)\n"
64 " movq %%mm2, 16(%1)\n"
65 " movq %%mm3, 24(%1)\n"
66 " movq 32(%0), %%mm0\n"
67 " movq 40(%0), %%mm1\n"
68 " movq 48(%0), %%mm2\n"
69 " movq 56(%0), %%mm3\n"
70 " movq %%mm0, 32(%1)\n"
71 " movq %%mm1, 40(%1)\n"
72 " movq %%mm2, 48(%1)\n"
73 " movq %%mm3, 56(%1)\n"
74 ".section .fixup, \"ax\"\n"
75 "3: movw $0x05EB, 1b\n"
79 : :
"r" (from),
"r" (to) :
"memory");
88 " movq 8(%0), %%mm1\n"
89 " movq 16(%0), %%mm2\n"
90 " movq 24(%0), %%mm3\n"
92 " movq %%mm1, 8(%1)\n"
93 " movq %%mm2, 16(%1)\n"
94 " movq %%mm3, 24(%1)\n"
95 " movq 32(%0), %%mm0\n"
96 " movq 40(%0), %%mm1\n"
97 " movq 48(%0), %%mm2\n"
98 " movq 56(%0), %%mm3\n"
99 " movq %%mm0, 32(%1)\n"
100 " movq %%mm1, 40(%1)\n"
101 " movq %%mm2, 48(%1)\n"
102 " movq %%mm3, 56(%1)\n"
103 : :
"r" (from),
"r" (to) :
"memory");
/*
 * fast_clear_page - zero memory starting at @page with MMX non-temporal
 * stores.
 * @page: start of the region to clear.
 *
 * The visible code zeroes %mm0 with pxor, then runs 4096/64 loop iterations,
 * each issuing eight 8-byte movntq stores (64 bytes in total) at offsets
 * 0..56 from @page, and finally executes sfence.
 *
 * NOTE(review): this view elides parts of the body (local declarations, the
 * asm statement openers, and whatever advances @page between iterations) -
 * confirm those against the full file.  A second definition with the same
 * name appears further down; presumably a preprocessor conditional that is
 * not visible here selects between the two.
 */
125 static void fast_clear_page(
void *
page)
132 " pxor %%mm0, %%mm0\n" : :
/* 64 iterations, 64 bytes stored per iteration. */
135 for (i = 0; i < 4096/64; i++) {
137 " movntq %%mm0, (%0)\n"
138 " movntq %%mm0, 8(%0)\n"
139 " movntq %%mm0, 16(%0)\n"
140 " movntq %%mm0, 24(%0)\n"
141 " movntq %%mm0, 32(%0)\n"
142 " movntq %%mm0, 40(%0)\n"
143 " movntq %%mm0, 48(%0)\n"
144 " movntq %%mm0, 56(%0)\n"
145 : :
"r" (page) :
"memory");
/* Store fence: orders the weakly-ordered movntq stores issued above. */
153 __asm__ __volatile__(
"sfence\n"::);
/*
 * fast_copy_page - copy from @from to @to using MMX loads and non-temporal
 * stores.
 * @to:   destination (asm operand %1 in the visible operand list).
 * @from: source (asm operand %0 in the visible operand list).
 *
 * Visible structure:
 *   - a prologue that prefetches ahead of the source;
 *   - a main loop of (4096-320)/64 iterations that prefetches 320 bytes
 *     ahead and moves 64 bytes per iteration through %mm0-%mm7, storing
 *     with movntq;
 *   - a tail loop covering the remaining iterations up to 4096/64 that does
 *     the same moves without the prefetch;
 *   - a trailing sfence.
 *
 * NOTE(review): this view elides parts of the body (declarations, asm
 * statement openers, the pointer advance between iterations, and any
 * exception-table entries) - confirm those against the full file.  A second
 * definition with the same name appears further down; presumably a
 * preprocessor conditional that is not visible here selects between them.
 */
158 static void fast_copy_page(
void *to,
void *
from)
171 " prefetch 128(%0)\n"
172 " prefetch 192(%0)\n"
173 " prefetch 256(%0)\n"
/*
 * Fixup code: stores the 16-bit value 0x1AEB (bytes EB 1A in memory, i.e. a
 * short jmp with displacement 0x1A) over the instruction at the nearest
 * preceding label 1.  Presumably this patches out the prefetch after it
 * faults; the mechanism that transfers control here is not visible.
 */
175 ".section .fixup, \"ax\"\n"
176 "3: movw $0x1AEB, 1b\n"
/* Main loop: stops 320 bytes (5 x 64) short of 4096. */
181 for (i = 0; i < (4096-320)/64; i++) {
183 "1: prefetch 320(%0)\n"
184 "2: movq (%0), %%mm0\n"
185 " movntq %%mm0, (%1)\n"
186 " movq 8(%0), %%mm1\n"
187 " movntq %%mm1, 8(%1)\n"
188 " movq 16(%0), %%mm2\n"
189 " movntq %%mm2, 16(%1)\n"
190 " movq 24(%0), %%mm3\n"
191 " movntq %%mm3, 24(%1)\n"
192 " movq 32(%0), %%mm4\n"
193 " movntq %%mm4, 32(%1)\n"
194 " movq 40(%0), %%mm5\n"
195 " movntq %%mm5, 40(%1)\n"
196 " movq 48(%0), %%mm6\n"
197 " movntq %%mm6, 48(%1)\n"
198 " movq 56(%0), %%mm7\n"
199 " movntq %%mm7, 56(%1)\n"
/*
 * Fixup code for the in-loop prefetch at label 1: writes bytes EB 05 (a
 * short jmp with displacement 5) over it.
 */
200 ".section .fixup, \"ax\"\n"
201 "3: movw $0x05EB, 1b\n"
/*
 * Tail loop: the remaining iterations, with no prefetch - presumably so the
 * 320-byte lookahead never reaches past the end of the source region.
 */
210 for (i = (4096-320)/64; i < 4096/64; i++) {
212 "2: movq (%0), %%mm0\n"
213 " movntq %%mm0, (%1)\n"
214 " movq 8(%0), %%mm1\n"
215 " movntq %%mm1, 8(%1)\n"
216 " movq 16(%0), %%mm2\n"
217 " movntq %%mm2, 16(%1)\n"
218 " movq 24(%0), %%mm3\n"
219 " movntq %%mm3, 24(%1)\n"
220 " movq 32(%0), %%mm4\n"
221 " movntq %%mm4, 32(%1)\n"
222 " movq 40(%0), %%mm5\n"
223 " movntq %%mm5, 40(%1)\n"
224 " movq 48(%0), %%mm6\n"
225 " movntq %%mm6, 48(%1)\n"
226 " movq 56(%0), %%mm7\n"
227 " movntq %%mm7, 56(%1)\n"
228 : :
"r" (from),
"r" (to) :
"memory");
/* Store fence: orders the weakly-ordered movntq stores issued above. */
236 __asm__ __volatile__(
"sfence \n"::);
/*
 * fast_clear_page - zero memory starting at @page with ordinary MMX stores.
 * @page: start of the region to clear.
 *
 * The visible code zeroes %mm0 with pxor, then runs 4096/128 loop
 * iterations, each issuing sixteen 8-byte movq stores (128 bytes in total)
 * at offsets 0..120 from @page.  Unlike the earlier definition of the same
 * name in this file, it uses movq rather than movntq, and no sfence is
 * visible.
 *
 * NOTE(review): this view elides parts of the body (declarations, the asm
 * statement openers, and whatever advances @page between iterations) -
 * confirm against the full file.  Presumably a preprocessor conditional not
 * visible here selects between the two definitions.
 */
245 static void fast_clear_page(
void *page)
252 " pxor %%mm0, %%mm0\n" : :
/* 32 iterations, 128 bytes stored per iteration. */
255 for (i = 0; i < 4096/128; i++) {
257 " movq %%mm0, (%0)\n"
258 " movq %%mm0, 8(%0)\n"
259 " movq %%mm0, 16(%0)\n"
260 " movq %%mm0, 24(%0)\n"
261 " movq %%mm0, 32(%0)\n"
262 " movq %%mm0, 40(%0)\n"
263 " movq %%mm0, 48(%0)\n"
264 " movq %%mm0, 56(%0)\n"
265 " movq %%mm0, 64(%0)\n"
266 " movq %%mm0, 72(%0)\n"
267 " movq %%mm0, 80(%0)\n"
268 " movq %%mm0, 88(%0)\n"
269 " movq %%mm0, 96(%0)\n"
270 " movq %%mm0, 104(%0)\n"
271 " movq %%mm0, 112(%0)\n"
272 " movq %%mm0, 120(%0)\n"
273 : :
"r" (page) :
"memory");
/*
 * fast_copy_page - copy from @from to @to using ordinary MMX loads and
 * stores.
 * @to:   destination (asm operand %1 in the visible operand list).
 * @from: source (asm operand %0 in the visible operand list).
 *
 * Visible structure: a prologue that prefetches ahead of the source, then a
 * single loop of 4096/64 iterations.  Each iteration prefetches 320 bytes
 * ahead and moves 64 bytes in two halves: four movq loads into %mm0-%mm3
 * followed by four movq stores, twice.
 *
 * NOTE(review): this view elides parts of the body (declarations, asm
 * statement openers, the pointer advance between iterations, and any
 * exception-table entries) - confirm against the full file.  An earlier
 * definition with the same name exists in this file; presumably a
 * preprocessor conditional not visible here selects between them.
 *
 * NOTE(review): the loop runs all 4096/64 iterations with the 320-byte
 * lookahead, so if the source pointer advances by 64 per iteration the last
 * five prefetches would target addresses beyond the 4096-byte source
 * region.  The earlier definition splits off a prefetch-free tail loop -
 * confirm whether the difference here is intentional.
 */
280 static void fast_copy_page(
void *to,
void *from)
289 " prefetch 128(%0)\n"
290 " prefetch 192(%0)\n"
291 " prefetch 256(%0)\n"
/*
 * Fixup code: stores the 16-bit value 0x1AEB (bytes EB 1A in memory, i.e. a
 * short jmp with displacement 0x1A) over the instruction at the nearest
 * preceding label 1.  Presumably this patches out the prefetch after it
 * faults; the mechanism that transfers control here is not visible.
 */
293 ".section .fixup, \"ax\"\n"
294 "3: movw $0x1AEB, 1b\n"
299 for (i = 0; i < 4096/64; i++) {
301 "1: prefetch 320(%0)\n"
/* First 32 bytes: load four quadwords, then store them. */
302 "2: movq (%0), %%mm0\n"
303 " movq 8(%0), %%mm1\n"
304 " movq 16(%0), %%mm2\n"
305 " movq 24(%0), %%mm3\n"
306 " movq %%mm0, (%1)\n"
307 " movq %%mm1, 8(%1)\n"
308 " movq %%mm2, 16(%1)\n"
309 " movq %%mm3, 24(%1)\n"
/* Second 32 bytes, reusing the same four registers. */
310 " movq 32(%0), %%mm0\n"
311 " movq 40(%0), %%mm1\n"
312 " movq 48(%0), %%mm2\n"
313 " movq 56(%0), %%mm3\n"
314 " movq %%mm0, 32(%1)\n"
315 " movq %%mm1, 40(%1)\n"
316 " movq %%mm2, 48(%1)\n"
317 " movq %%mm3, 56(%1)\n"
/*
 * Fixup code for the in-loop prefetch at label 1: writes bytes EB 05 (a
 * short jmp with displacement 5) over it.
 */
318 ".section .fixup, \"ax\"\n"
319 "3: movw $0x05EB, 1b\n"
323 : :
"r" (from),
"r" (to) :
"memory");
/*
 * slow_zero_page - clear memory at @page via an inline-asm sequence that
 * does not use MMX registers in its visible operand list.
 * @page: start of the region to clear.
 *
 * NOTE(review): the asm instruction string and the local declarations are
 * not visible in this view.  The register setup below (a = 0, c = 1024,
 * D = @page) is consistent with a "rep stos"-style fill of 1024 dwords
 * (4096 bytes) - confirm against the full file.
 */
336 static void slow_zero_page(
void *page)
/* Outputs: early-clobber dummies that receive the final c and D registers. */
344 :
"=&c" (d0),
"=&D" (d1)
/*
 * Inputs: a = 0; "1" ties @page to operand 1 (the D register); "0" ties
 * the count 1024 to operand 0 (the c register).
 */
345 :
"a" (0),
"1" (page),
"0" (1024)
352 slow_zero_page(page);
354 fast_clear_page(page);
/*
 * slow_copy_page - copy from @from to @to via an inline-asm sequence that
 * does not use MMX registers in its visible operand list.
 * @to:   destination, passed in the D register.
 * @from: source, passed in the S register.
 *
 * NOTE(review): the asm instruction string and the local declarations are
 * not visible in this view.  The register setup below (c = 1024, D = @to,
 * S = @from) is consistent with a "rep movs"-style copy of 1024 dwords
 * (4096 bytes) - confirm against the full file.
 */
358 static void slow_copy_page(
void *to,
void *from)
/* Outputs: early-clobber dummies for the final c, D and S registers. */
365 :
"=&c" (d0),
"=&D" (d1),
"=&S" (d2)
/*
 * Inputs are tied to the outputs by position: "0" = count 1024 (c),
 * "1" = @to (D), "2" = @from (S).
 */
366 :
"0" (1024),
"1" ((
long) to),
"2" ((
long) from)
373 slow_copy_page(to, from);
375 fast_copy_page(to, from);