]> git.ipfire.org Git - thirdparty/qemu.git/blob - tests/test-i386.c
9f1c4f0038f4ecd1912bb84f17aaf444c27fd2a2
[thirdparty/qemu.git] / tests / test-i386.c
1 /*
2 * x86 CPU test
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
19 */
20 #define _GNU_SOURCE
21 #include <stdlib.h>
22 #include <stdio.h>
23 #include <string.h>
24 #include <inttypes.h>
25 #include <math.h>
26 #include <signal.h>
27 #include <setjmp.h>
28 #include <errno.h>
29 #include <sys/ucontext.h>
30 #include <sys/mman.h>
31 #include <asm/vm86.h>
32
33 #define TEST_CMOV 0
34 #define TEST_FCOMI 0
35 #define TEST_VM86
36 //#define LINUX_VM86_IOPL_FIX
37 //#define TEST_P4_FLAGS
38 //#define TEST_SSE
39
40 #define xglue(x, y) x ## y
41 #define glue(x, y) xglue(x, y)
42 #define stringify(s) tostring(s)
43 #define tostring(s) #s
44
45 #define CC_C 0x0001
46 #define CC_P 0x0004
47 #define CC_A 0x0010
48 #define CC_Z 0x0040
49 #define CC_S 0x0080
50 #define CC_O 0x0800
51
52 #define __init_call __attribute__ ((unused,__section__ (".initcall.init")))
53
54 static void *call_start __init_call = NULL;
55
56 #define CC_MASK (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A)
57
58 #define OP add
59 #include "test-i386.h"
60
61 #define OP sub
62 #include "test-i386.h"
63
64 #define OP xor
65 #include "test-i386.h"
66
67 #define OP and
68 #include "test-i386.h"
69
70 #define OP or
71 #include "test-i386.h"
72
73 #define OP cmp
74 #include "test-i386.h"
75
76 #define OP adc
77 #define OP_CC
78 #include "test-i386.h"
79
80 #define OP sbb
81 #define OP_CC
82 #include "test-i386.h"
83
84 #define OP inc
85 #define OP_CC
86 #define OP1
87 #include "test-i386.h"
88
89 #define OP dec
90 #define OP_CC
91 #define OP1
92 #include "test-i386.h"
93
94 #define OP neg
95 #define OP_CC
96 #define OP1
97 #include "test-i386.h"
98
99 #define OP not
100 #define OP_CC
101 #define OP1
102 #include "test-i386.h"
103
104 #undef CC_MASK
105 #define CC_MASK (CC_C | CC_P | CC_Z | CC_S | CC_O)
106
107 #define OP shl
108 #include "test-i386-shift.h"
109
110 #define OP shr
111 #include "test-i386-shift.h"
112
113 #define OP sar
114 #include "test-i386-shift.h"
115
116 #define OP rol
117 #include "test-i386-shift.h"
118
119 #define OP ror
120 #include "test-i386-shift.h"
121
122 #define OP rcr
123 #define OP_CC
124 #include "test-i386-shift.h"
125
126 #define OP rcl
127 #define OP_CC
128 #include "test-i386-shift.h"
129
130 #define OP shld
131 #define OP_SHIFTD
132 #define OP_NOBYTE
133 #include "test-i386-shift.h"
134
135 #define OP shrd
136 #define OP_SHIFTD
137 #define OP_NOBYTE
138 #include "test-i386-shift.h"
139
140 /* XXX: should be more precise ? */
141 #undef CC_MASK
142 #define CC_MASK (CC_C)
143
144 #define OP bt
145 #define OP_NOBYTE
146 #include "test-i386-shift.h"
147
148 #define OP bts
149 #define OP_NOBYTE
150 #include "test-i386-shift.h"
151
152 #define OP btr
153 #define OP_NOBYTE
154 #include "test-i386-shift.h"
155
156 #define OP btc
157 #define OP_NOBYTE
158 #include "test-i386-shift.h"
159
160 /* lea test (modrm support) */
161 #define TEST_LEA(STR)\
162 {\
163 asm("leal " STR ", %0"\
164 : "=r" (res)\
165 : "a" (eax), "b" (ebx), "c" (ecx), "d" (edx), "S" (esi), "D" (edi));\
166 printf("lea %s = %08x\n", STR, res);\
167 }
168
169 #define TEST_LEA16(STR)\
170 {\
171 asm(".code16 ; .byte 0x67 ; leal " STR ", %0 ; .code32"\
172 : "=wq" (res)\
173 : "a" (eax), "b" (ebx), "c" (ecx), "d" (edx), "S" (esi), "D" (edi));\
174 printf("lea %s = %08x\n", STR, res);\
175 }
176
177
178 void test_lea(void)
179 {
180 int eax, ebx, ecx, edx, esi, edi, res;
181 eax = 0x0001;
182 ebx = 0x0002;
183 ecx = 0x0004;
184 edx = 0x0008;
185 esi = 0x0010;
186 edi = 0x0020;
187
188 TEST_LEA("0x4000");
189
190 TEST_LEA("(%%eax)");
191 TEST_LEA("(%%ebx)");
192 TEST_LEA("(%%ecx)");
193 TEST_LEA("(%%edx)");
194 TEST_LEA("(%%esi)");
195 TEST_LEA("(%%edi)");
196
197 TEST_LEA("0x40(%%eax)");
198 TEST_LEA("0x40(%%ebx)");
199 TEST_LEA("0x40(%%ecx)");
200 TEST_LEA("0x40(%%edx)");
201 TEST_LEA("0x40(%%esi)");
202 TEST_LEA("0x40(%%edi)");
203
204 TEST_LEA("0x4000(%%eax)");
205 TEST_LEA("0x4000(%%ebx)");
206 TEST_LEA("0x4000(%%ecx)");
207 TEST_LEA("0x4000(%%edx)");
208 TEST_LEA("0x4000(%%esi)");
209 TEST_LEA("0x4000(%%edi)");
210
211 TEST_LEA("(%%eax, %%ecx)");
212 TEST_LEA("(%%ebx, %%edx)");
213 TEST_LEA("(%%ecx, %%ecx)");
214 TEST_LEA("(%%edx, %%ecx)");
215 TEST_LEA("(%%esi, %%ecx)");
216 TEST_LEA("(%%edi, %%ecx)");
217
218 TEST_LEA("0x40(%%eax, %%ecx)");
219 TEST_LEA("0x4000(%%ebx, %%edx)");
220
221 TEST_LEA("(%%ecx, %%ecx, 2)");
222 TEST_LEA("(%%edx, %%ecx, 4)");
223 TEST_LEA("(%%esi, %%ecx, 8)");
224
225 TEST_LEA("(,%%eax, 2)");
226 TEST_LEA("(,%%ebx, 4)");
227 TEST_LEA("(,%%ecx, 8)");
228
229 TEST_LEA("0x40(,%%eax, 2)");
230 TEST_LEA("0x40(,%%ebx, 4)");
231 TEST_LEA("0x40(,%%ecx, 8)");
232
233
234 TEST_LEA("-10(%%ecx, %%ecx, 2)");
235 TEST_LEA("-10(%%edx, %%ecx, 4)");
236 TEST_LEA("-10(%%esi, %%ecx, 8)");
237
238 TEST_LEA("0x4000(%%ecx, %%ecx, 2)");
239 TEST_LEA("0x4000(%%edx, %%ecx, 4)");
240 TEST_LEA("0x4000(%%esi, %%ecx, 8)");
241
242 /* limited 16 bit addressing test */
243 TEST_LEA16("0x4000");
244 TEST_LEA16("(%%bx)");
245 TEST_LEA16("(%%si)");
246 TEST_LEA16("(%%di)");
247 TEST_LEA16("0x40(%%bx)");
248 TEST_LEA16("0x40(%%si)");
249 TEST_LEA16("0x40(%%di)");
250 TEST_LEA16("0x4000(%%bx)");
251 TEST_LEA16("0x4000(%%si)");
252 TEST_LEA16("(%%bx,%%si)");
253 TEST_LEA16("(%%bx,%%di)");
254 TEST_LEA16("0x40(%%bx,%%si)");
255 TEST_LEA16("0x40(%%bx,%%di)");
256 TEST_LEA16("0x4000(%%bx,%%si)");
257 TEST_LEA16("0x4000(%%bx,%%di)");
258 }
259
260 #define TEST_JCC(JCC, v1, v2)\
261 {\
262 int res;\
263 asm("movl $1, %0\n\t"\
264 "cmpl %2, %1\n\t"\
265 "j" JCC " 1f\n\t"\
266 "movl $0, %0\n\t"\
267 "1:\n\t"\
268 : "=r" (res)\
269 : "r" (v1), "r" (v2));\
270 printf("%-10s %d\n", "j" JCC, res);\
271 \
272 asm("movl $0, %0\n\t"\
273 "cmpl %2, %1\n\t"\
274 "set" JCC " %b0\n\t"\
275 : "=r" (res)\
276 : "r" (v1), "r" (v2));\
277 printf("%-10s %d\n", "set" JCC, res);\
278 if (TEST_CMOV) {\
279 asm("movl $0x12345678, %0\n\t"\
280 "cmpl %2, %1\n\t"\
281 "cmov" JCC "l %3, %0\n\t"\
282 : "=r" (res)\
283 : "r" (v1), "r" (v2), "m" (1));\
284 printf("%-10s R=0x%08x\n", "cmov" JCC "l", res);\
285 asm("movl $0x12345678, %0\n\t"\
286 "cmpl %2, %1\n\t"\
287 "cmov" JCC "w %w3, %w0\n\t"\
288 : "=r" (res)\
289 : "r" (v1), "r" (v2), "r" (1));\
290 printf("%-10s R=0x%08x\n", "cmov" JCC "w", res);\
291 } \
292 }
293
294 /* various jump tests */
295 void test_jcc(void)
296 {
297 TEST_JCC("ne", 1, 1);
298 TEST_JCC("ne", 1, 0);
299
300 TEST_JCC("e", 1, 1);
301 TEST_JCC("e", 1, 0);
302
303 TEST_JCC("l", 1, 1);
304 TEST_JCC("l", 1, 0);
305 TEST_JCC("l", 1, -1);
306
307 TEST_JCC("le", 1, 1);
308 TEST_JCC("le", 1, 0);
309 TEST_JCC("le", 1, -1);
310
311 TEST_JCC("ge", 1, 1);
312 TEST_JCC("ge", 1, 0);
313 TEST_JCC("ge", -1, 1);
314
315 TEST_JCC("g", 1, 1);
316 TEST_JCC("g", 1, 0);
317 TEST_JCC("g", 1, -1);
318
319 TEST_JCC("b", 1, 1);
320 TEST_JCC("b", 1, 0);
321 TEST_JCC("b", 1, -1);
322
323 TEST_JCC("be", 1, 1);
324 TEST_JCC("be", 1, 0);
325 TEST_JCC("be", 1, -1);
326
327 TEST_JCC("ae", 1, 1);
328 TEST_JCC("ae", 1, 0);
329 TEST_JCC("ae", 1, -1);
330
331 TEST_JCC("a", 1, 1);
332 TEST_JCC("a", 1, 0);
333 TEST_JCC("a", 1, -1);
334
335
336 TEST_JCC("p", 1, 1);
337 TEST_JCC("p", 1, 0);
338
339 TEST_JCC("np", 1, 1);
340 TEST_JCC("np", 1, 0);
341
342 TEST_JCC("o", 0x7fffffff, 0);
343 TEST_JCC("o", 0x7fffffff, -1);
344
345 TEST_JCC("no", 0x7fffffff, 0);
346 TEST_JCC("no", 0x7fffffff, -1);
347
348 TEST_JCC("s", 0, 1);
349 TEST_JCC("s", 0, -1);
350 TEST_JCC("s", 0, 0);
351
352 TEST_JCC("ns", 0, 1);
353 TEST_JCC("ns", 0, -1);
354 TEST_JCC("ns", 0, 0);
355 }
356
357 #undef CC_MASK
358 #ifdef TEST_P4_FLAGS
359 #define CC_MASK (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A)
360 #else
361 #define CC_MASK (CC_O | CC_C)
362 #endif
363
364 #define OP mul
365 #include "test-i386-muldiv.h"
366
367 #define OP imul
368 #include "test-i386-muldiv.h"
369
370 void test_imulw2(int op0, int op1)
371 {
372 int res, s1, s0, flags;
373 s0 = op0;
374 s1 = op1;
375 res = s0;
376 flags = 0;
377 asm volatile ("push %4\n\t"
378 "popf\n\t"
379 "imulw %w2, %w0\n\t"
380 "pushf\n\t"
381 "popl %1\n\t"
382 : "=q" (res), "=g" (flags)
383 : "q" (s1), "0" (res), "1" (flags));
384 printf("%-10s A=%08x B=%08x R=%08x CC=%04x\n",
385 "imulw", s0, s1, res, flags & CC_MASK);
386 }
387
388 void test_imull2(int op0, int op1)
389 {
390 int res, s1, s0, flags;
391 s0 = op0;
392 s1 = op1;
393 res = s0;
394 flags = 0;
395 asm volatile ("push %4\n\t"
396 "popf\n\t"
397 "imull %2, %0\n\t"
398 "pushf\n\t"
399 "popl %1\n\t"
400 : "=q" (res), "=g" (flags)
401 : "q" (s1), "0" (res), "1" (flags));
402 printf("%-10s A=%08x B=%08x R=%08x CC=%04x\n",
403 "imull", s0, s1, res, flags & CC_MASK);
404 }
405
406 #define TEST_IMUL_IM(size, size1, op0, op1)\
407 {\
408 int res, flags;\
409 flags = 0;\
410 res = 0;\
411 asm volatile ("push %3\n\t"\
412 "popf\n\t"\
413 "imul" size " $" #op0 ", %" size1 "2, %" size1 "0\n\t" \
414 "pushf\n\t"\
415 "popl %1\n\t"\
416 : "=r" (res), "=g" (flags)\
417 : "r" (op1), "1" (flags), "0" (res));\
418 printf("%-10s A=%08x B=%08x R=%08x CC=%04x\n",\
419 "imul" size " im", op0, op1, res, flags & CC_MASK);\
420 }
421
422
423 #undef CC_MASK
424 #define CC_MASK (0)
425
426 #define OP div
427 #include "test-i386-muldiv.h"
428
429 #define OP idiv
430 #include "test-i386-muldiv.h"
431
432 void test_mul(void)
433 {
434 test_imulb(0x1234561d, 4);
435 test_imulb(3, -4);
436 test_imulb(0x80, 0x80);
437 test_imulb(0x10, 0x10);
438
439 test_imulw(0, 0x1234001d, 45);
440 test_imulw(0, 23, -45);
441 test_imulw(0, 0x8000, 0x8000);
442 test_imulw(0, 0x100, 0x100);
443
444 test_imull(0, 0x1234001d, 45);
445 test_imull(0, 23, -45);
446 test_imull(0, 0x80000000, 0x80000000);
447 test_imull(0, 0x10000, 0x10000);
448
449 test_mulb(0x1234561d, 4);
450 test_mulb(3, -4);
451 test_mulb(0x80, 0x80);
452 test_mulb(0x10, 0x10);
453
454 test_mulw(0, 0x1234001d, 45);
455 test_mulw(0, 23, -45);
456 test_mulw(0, 0x8000, 0x8000);
457 test_mulw(0, 0x100, 0x100);
458
459 test_mull(0, 0x1234001d, 45);
460 test_mull(0, 23, -45);
461 test_mull(0, 0x80000000, 0x80000000);
462 test_mull(0, 0x10000, 0x10000);
463
464 test_imulw2(0x1234001d, 45);
465 test_imulw2(23, -45);
466 test_imulw2(0x8000, 0x8000);
467 test_imulw2(0x100, 0x100);
468
469 test_imull2(0x1234001d, 45);
470 test_imull2(23, -45);
471 test_imull2(0x80000000, 0x80000000);
472 test_imull2(0x10000, 0x10000);
473
474 TEST_IMUL_IM("w", "w", 45, 0x1234);
475 TEST_IMUL_IM("w", "w", -45, 23);
476 TEST_IMUL_IM("w", "w", 0x8000, 0x80000000);
477 TEST_IMUL_IM("w", "w", 0x7fff, 0x1000);
478
479 TEST_IMUL_IM("l", "", 45, 0x1234);
480 TEST_IMUL_IM("l", "", -45, 23);
481 TEST_IMUL_IM("l", "", 0x8000, 0x80000000);
482 TEST_IMUL_IM("l", "", 0x7fff, 0x1000);
483
484 test_idivb(0x12341678, 0x127e);
485 test_idivb(0x43210123, -5);
486 test_idivb(0x12340004, -1);
487
488 test_idivw(0, 0x12345678, 12347);
489 test_idivw(0, -23223, -45);
490 test_idivw(0, 0x12348000, -1);
491 test_idivw(0x12343, 0x12345678, 0x81238567);
492
493 test_idivl(0, 0x12345678, 12347);
494 test_idivl(0, -233223, -45);
495 test_idivl(0, 0x80000000, -1);
496 test_idivl(0x12343, 0x12345678, 0x81234567);
497
498 test_divb(0x12341678, 0x127e);
499 test_divb(0x43210123, -5);
500 test_divb(0x12340004, -1);
501
502 test_divw(0, 0x12345678, 12347);
503 test_divw(0, -23223, -45);
504 test_divw(0, 0x12348000, -1);
505 test_divw(0x12343, 0x12345678, 0x81238567);
506
507 test_divl(0, 0x12345678, 12347);
508 test_divl(0, -233223, -45);
509 test_divl(0, 0x80000000, -1);
510 test_divl(0x12343, 0x12345678, 0x81234567);
511 }
512
513 #define TEST_BSX(op, size, op0)\
514 {\
515 int res, val, resz;\
516 val = op0;\
517 asm("xorl %1, %1\n"\
518 "movl $0x12345678, %0\n"\
519 #op " %" size "2, %" size "0 ; setz %b1" \
520 : "=r" (res), "=q" (resz)\
521 : "g" (val));\
522 printf("%-10s A=%08x R=%08x %d\n", #op, val, res, resz);\
523 }
524
525 void test_bsx(void)
526 {
527 TEST_BSX(bsrw, "w", 0);
528 TEST_BSX(bsrw, "w", 0x12340128);
529 TEST_BSX(bsrl, "", 0);
530 TEST_BSX(bsrl, "", 0x00340128);
531 TEST_BSX(bsfw, "w", 0);
532 TEST_BSX(bsfw, "w", 0x12340128);
533 TEST_BSX(bsfl, "", 0);
534 TEST_BSX(bsfl, "", 0x00340128);
535 }
536
537 /**********************************************/
538
539 void test_fops(double a, double b)
540 {
541 printf("a=%f b=%f a+b=%f\n", a, b, a + b);
542 printf("a=%f b=%f a-b=%f\n", a, b, a - b);
543 printf("a=%f b=%f a*b=%f\n", a, b, a * b);
544 printf("a=%f b=%f a/b=%f\n", a, b, a / b);
545 printf("a=%f b=%f fmod(a, b)=%f\n", a, b, fmod(a, b));
546 printf("a=%f sqrt(a)=%f\n", a, sqrt(a));
547 printf("a=%f sin(a)=%f\n", a, sin(a));
548 printf("a=%f cos(a)=%f\n", a, cos(a));
549 printf("a=%f tan(a)=%f\n", a, tan(a));
550 printf("a=%f log(a)=%f\n", a, log(a));
551 printf("a=%f exp(a)=%f\n", a, exp(a));
552 printf("a=%f b=%f atan2(a, b)=%f\n", a, b, atan2(a, b));
553 /* just to test some op combining */
554 printf("a=%f asin(sin(a))=%f\n", a, asin(sin(a)));
555 printf("a=%f acos(cos(a))=%f\n", a, acos(cos(a)));
556 printf("a=%f atan(tan(a))=%f\n", a, atan(tan(a)));
557
558 }
559
560 void test_fcmp(double a, double b)
561 {
562 printf("(%f<%f)=%d\n",
563 a, b, a < b);
564 printf("(%f<=%f)=%d\n",
565 a, b, a <= b);
566 printf("(%f==%f)=%d\n",
567 a, b, a == b);
568 printf("(%f>%f)=%d\n",
569 a, b, a > b);
570 printf("(%f<=%f)=%d\n",
571 a, b, a >= b);
572 if (TEST_FCOMI) {
573 unsigned int eflags;
574 /* test f(u)comi instruction */
575 asm("fcomi %2, %1\n"
576 "pushf\n"
577 "pop %0\n"
578 : "=r" (eflags)
579 : "t" (a), "u" (b));
580 printf("fcomi(%f %f)=%08x\n", a, b, eflags & (CC_Z | CC_P | CC_C));
581 }
582 }
583
584 void test_fcvt(double a)
585 {
586 float fa;
587 long double la;
588 int16_t fpuc;
589 int i;
590 int64_t lla;
591 int ia;
592 int16_t wa;
593 double ra;
594
595 fa = a;
596 la = a;
597 printf("(float)%f = %f\n", a, fa);
598 printf("(long double)%f = %Lf\n", a, la);
599 printf("a=%016Lx\n", *(long long *)&a);
600 printf("la=%016Lx %04x\n", *(long long *)&la,
601 *(unsigned short *)((char *)(&la) + 8));
602
603 /* test all roundings */
604 asm volatile ("fstcw %0" : "=m" (fpuc));
605 for(i=0;i<4;i++) {
606 asm volatile ("fldcw %0" : : "m" ((fpuc & ~0x0c00) | (i << 10)));
607 asm volatile ("fist %0" : "=m" (wa) : "t" (a));
608 asm volatile ("fistl %0" : "=m" (ia) : "t" (a));
609 asm volatile ("fistpll %0" : "=m" (lla) : "t" (a) : "st");
610 asm volatile ("frndint ; fstl %0" : "=m" (ra) : "t" (a));
611 asm volatile ("fldcw %0" : : "m" (fpuc));
612 printf("(short)a = %d\n", wa);
613 printf("(int)a = %d\n", ia);
614 printf("(int64_t)a = %Ld\n", lla);
615 printf("rint(a) = %f\n", ra);
616 }
617 }
618
619 #define TEST(N) \
620 asm("fld" #N : "=t" (a)); \
621 printf("fld" #N "= %f\n", a);
622
623 void test_fconst(void)
624 {
625 double a;
626 TEST(1);
627 TEST(l2t);
628 TEST(l2e);
629 TEST(pi);
630 TEST(lg2);
631 TEST(ln2);
632 TEST(z);
633 }
634
635 void test_fbcd(double a)
636 {
637 unsigned short bcd[5];
638 double b;
639
640 asm("fbstp %0" : "=m" (bcd[0]) : "t" (a) : "st");
641 asm("fbld %1" : "=t" (b) : "m" (bcd[0]));
642 printf("a=%f bcd=%04x%04x%04x%04x%04x b=%f\n",
643 a, bcd[4], bcd[3], bcd[2], bcd[1], bcd[0], b);
644 }
645
646 #define TEST_ENV(env, save, restore)\
647 {\
648 memset((env), 0xaa, sizeof(*(env)));\
649 for(i=0;i<5;i++)\
650 asm volatile ("fldl %0" : : "m" (dtab[i]));\
651 asm volatile (save " %0\n" : : "m" (*(env)));\
652 asm volatile (restore " %0\n": : "m" (*(env)));\
653 for(i=0;i<5;i++)\
654 asm volatile ("fstpl %0" : "=m" (rtab[i]));\
655 for(i=0;i<5;i++)\
656 printf("res[%d]=%f\n", i, rtab[i]);\
657 printf("fpuc=%04x fpus=%04x fptag=%04x\n",\
658 (env)->fpuc,\
659 (env)->fpus & 0xff00,\
660 (env)->fptag);\
661 }
662
663 void test_fenv(void)
664 {
665 struct __attribute__((packed)) {
666 uint16_t fpuc;
667 uint16_t dummy1;
668 uint16_t fpus;
669 uint16_t dummy2;
670 uint16_t fptag;
671 uint16_t dummy3;
672 uint32_t ignored[4];
673 long double fpregs[8];
674 } float_env32;
675 struct __attribute__((packed)) {
676 uint16_t fpuc;
677 uint16_t fpus;
678 uint16_t fptag;
679 uint16_t ignored[4];
680 long double fpregs[8];
681 } float_env16;
682 double dtab[8];
683 double rtab[8];
684 int i;
685
686 for(i=0;i<8;i++)
687 dtab[i] = i + 1;
688
689 TEST_ENV(&float_env16, "data16 fnstenv", "data16 fldenv");
690 TEST_ENV(&float_env16, "data16 fnsave", "data16 frstor");
691 TEST_ENV(&float_env32, "fnstenv", "fldenv");
692 TEST_ENV(&float_env32, "fnsave", "frstor");
693
694 /* test for ffree */
695 for(i=0;i<5;i++)
696 asm volatile ("fldl %0" : : "m" (dtab[i]));
697 asm volatile("ffree %st(2)");
698 asm volatile ("fnstenv %0\n" : : "m" (float_env32));
699 asm volatile ("fninit");
700 printf("fptag=%04x\n", float_env32.fptag);
701 }
702
703
704 #define TEST_FCMOV(a, b, eflags, CC)\
705 {\
706 double res;\
707 asm("push %3\n"\
708 "popf\n"\
709 "fcmov" CC " %2, %0\n"\
710 : "=t" (res)\
711 : "0" (a), "u" (b), "g" (eflags));\
712 printf("fcmov%s eflags=0x%04x-> %f\n", \
713 CC, eflags, res);\
714 }
715
716 void test_fcmov(void)
717 {
718 double a, b;
719 int eflags, i;
720
721 a = 1.0;
722 b = 2.0;
723 for(i = 0; i < 4; i++) {
724 eflags = 0;
725 if (i & 1)
726 eflags |= CC_C;
727 if (i & 2)
728 eflags |= CC_Z;
729 TEST_FCMOV(a, b, eflags, "b");
730 TEST_FCMOV(a, b, eflags, "e");
731 TEST_FCMOV(a, b, eflags, "be");
732 TEST_FCMOV(a, b, eflags, "nb");
733 TEST_FCMOV(a, b, eflags, "ne");
734 TEST_FCMOV(a, b, eflags, "nbe");
735 }
736 TEST_FCMOV(a, b, 0, "u");
737 TEST_FCMOV(a, b, CC_P, "u");
738 TEST_FCMOV(a, b, 0, "nu");
739 TEST_FCMOV(a, b, CC_P, "nu");
740 }
741
742 void test_floats(void)
743 {
744 test_fops(2, 3);
745 test_fops(1.4, -5);
746 test_fcmp(2, -1);
747 test_fcmp(2, 2);
748 test_fcmp(2, 3);
749 test_fcvt(0.5);
750 test_fcvt(-0.5);
751 test_fcvt(1.0/7.0);
752 test_fcvt(-1.0/9.0);
753 test_fcvt(32768);
754 test_fcvt(-1e20);
755 test_fconst();
756 test_fbcd(1234567890123456);
757 test_fbcd(-123451234567890);
758 test_fenv();
759 if (TEST_CMOV) {
760 test_fcmov();
761 }
762 }
763
764 /**********************************************/
765
766 #define TEST_BCD(op, op0, cc_in, cc_mask)\
767 {\
768 int res, flags;\
769 res = op0;\
770 flags = cc_in;\
771 asm ("push %3\n\t"\
772 "popf\n\t"\
773 #op "\n\t"\
774 "pushf\n\t"\
775 "popl %1\n\t"\
776 : "=a" (res), "=g" (flags)\
777 : "0" (res), "1" (flags));\
778 printf("%-10s A=%08x R=%08x CCIN=%04x CC=%04x\n",\
779 #op, op0, res, cc_in, flags & cc_mask);\
780 }
781
782 void test_bcd(void)
783 {
784 TEST_BCD(daa, 0x12340503, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
785 TEST_BCD(daa, 0x12340506, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
786 TEST_BCD(daa, 0x12340507, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
787 TEST_BCD(daa, 0x12340559, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
788 TEST_BCD(daa, 0x12340560, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
789 TEST_BCD(daa, 0x1234059f, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
790 TEST_BCD(daa, 0x123405a0, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
791 TEST_BCD(daa, 0x12340503, 0, (CC_C | CC_P | CC_Z | CC_S | CC_A));
792 TEST_BCD(daa, 0x12340506, 0, (CC_C | CC_P | CC_Z | CC_S | CC_A));
793 TEST_BCD(daa, 0x12340503, CC_C, (CC_C | CC_P | CC_Z | CC_S | CC_A));
794 TEST_BCD(daa, 0x12340506, CC_C, (CC_C | CC_P | CC_Z | CC_S | CC_A));
795 TEST_BCD(daa, 0x12340503, CC_C | CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
796 TEST_BCD(daa, 0x12340506, CC_C | CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
797
798 TEST_BCD(das, 0x12340503, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
799 TEST_BCD(das, 0x12340506, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
800 TEST_BCD(das, 0x12340507, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
801 TEST_BCD(das, 0x12340559, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
802 TEST_BCD(das, 0x12340560, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
803 TEST_BCD(das, 0x1234059f, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
804 TEST_BCD(das, 0x123405a0, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
805 TEST_BCD(das, 0x12340503, 0, (CC_C | CC_P | CC_Z | CC_S | CC_A));
806 TEST_BCD(das, 0x12340506, 0, (CC_C | CC_P | CC_Z | CC_S | CC_A));
807 TEST_BCD(das, 0x12340503, CC_C, (CC_C | CC_P | CC_Z | CC_S | CC_A));
808 TEST_BCD(das, 0x12340506, CC_C, (CC_C | CC_P | CC_Z | CC_S | CC_A));
809 TEST_BCD(das, 0x12340503, CC_C | CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
810 TEST_BCD(das, 0x12340506, CC_C | CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_A));
811
812 TEST_BCD(aaa, 0x12340205, CC_A, (CC_C | CC_A));
813 TEST_BCD(aaa, 0x12340306, CC_A, (CC_C | CC_A));
814 TEST_BCD(aaa, 0x1234040a, CC_A, (CC_C | CC_A));
815 TEST_BCD(aaa, 0x123405fa, CC_A, (CC_C | CC_A));
816 TEST_BCD(aaa, 0x12340205, 0, (CC_C | CC_A));
817 TEST_BCD(aaa, 0x12340306, 0, (CC_C | CC_A));
818 TEST_BCD(aaa, 0x1234040a, 0, (CC_C | CC_A));
819 TEST_BCD(aaa, 0x123405fa, 0, (CC_C | CC_A));
820
821 TEST_BCD(aas, 0x12340205, CC_A, (CC_C | CC_A));
822 TEST_BCD(aas, 0x12340306, CC_A, (CC_C | CC_A));
823 TEST_BCD(aas, 0x1234040a, CC_A, (CC_C | CC_A));
824 TEST_BCD(aas, 0x123405fa, CC_A, (CC_C | CC_A));
825 TEST_BCD(aas, 0x12340205, 0, (CC_C | CC_A));
826 TEST_BCD(aas, 0x12340306, 0, (CC_C | CC_A));
827 TEST_BCD(aas, 0x1234040a, 0, (CC_C | CC_A));
828 TEST_BCD(aas, 0x123405fa, 0, (CC_C | CC_A));
829
830 TEST_BCD(aam, 0x12340547, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A));
831 TEST_BCD(aad, 0x12340407, CC_A, (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A));
832 }
833
834 #define TEST_XCHG(op, size, opconst)\
835 {\
836 int op0, op1;\
837 op0 = 0x12345678;\
838 op1 = 0xfbca7654;\
839 asm(#op " %" size "0, %" size "1" \
840 : "=q" (op0), opconst (op1) \
841 : "0" (op0), "1" (op1));\
842 printf("%-10s A=%08x B=%08x\n",\
843 #op, op0, op1);\
844 }
845
846 #define TEST_CMPXCHG(op, size, opconst, eax)\
847 {\
848 int op0, op1;\
849 op0 = 0x12345678;\
850 op1 = 0xfbca7654;\
851 asm(#op " %" size "0, %" size "1" \
852 : "=q" (op0), opconst (op1) \
853 : "0" (op0), "1" (op1), "a" (eax));\
854 printf("%-10s EAX=%08x A=%08x C=%08x\n",\
855 #op, eax, op0, op1);\
856 }
857
858 void test_xchg(void)
859 {
860 TEST_XCHG(xchgl, "", "=q");
861 TEST_XCHG(xchgw, "w", "=q");
862 TEST_XCHG(xchgb, "b", "=q");
863
864 TEST_XCHG(xchgl, "", "=m");
865 TEST_XCHG(xchgw, "w", "=m");
866 TEST_XCHG(xchgb, "b", "=m");
867
868 TEST_XCHG(xaddl, "", "=q");
869 TEST_XCHG(xaddw, "w", "=q");
870 TEST_XCHG(xaddb, "b", "=q");
871
872 {
873 int res;
874 res = 0x12345678;
875 asm("xaddl %1, %0" : "=r" (res) : "0" (res));
876 printf("xaddl same res=%08x\n", res);
877 }
878
879 TEST_XCHG(xaddl, "", "=m");
880 TEST_XCHG(xaddw, "w", "=m");
881 TEST_XCHG(xaddb, "b", "=m");
882
883 TEST_CMPXCHG(cmpxchgl, "", "=q", 0xfbca7654);
884 TEST_CMPXCHG(cmpxchgw, "w", "=q", 0xfbca7654);
885 TEST_CMPXCHG(cmpxchgb, "b", "=q", 0xfbca7654);
886
887 TEST_CMPXCHG(cmpxchgl, "", "=q", 0xfffefdfc);
888 TEST_CMPXCHG(cmpxchgw, "w", "=q", 0xfffefdfc);
889 TEST_CMPXCHG(cmpxchgb, "b", "=q", 0xfffefdfc);
890
891 TEST_CMPXCHG(cmpxchgl, "", "=m", 0xfbca7654);
892 TEST_CMPXCHG(cmpxchgw, "w", "=m", 0xfbca7654);
893 TEST_CMPXCHG(cmpxchgb, "b", "=m", 0xfbca7654);
894
895 TEST_CMPXCHG(cmpxchgl, "", "=m", 0xfffefdfc);
896 TEST_CMPXCHG(cmpxchgw, "w", "=m", 0xfffefdfc);
897 TEST_CMPXCHG(cmpxchgb, "b", "=m", 0xfffefdfc);
898
899 {
900 uint64_t op0, op1, op2;
901 int i, eflags;
902
903 for(i = 0; i < 2; i++) {
904 op0 = 0x123456789abcd;
905 if (i == 0)
906 op1 = 0xfbca765423456;
907 else
908 op1 = op0;
909 op2 = 0x6532432432434;
910 asm("cmpxchg8b %1\n"
911 "pushf\n"
912 "popl %2\n"
913 : "=A" (op0), "=m" (op1), "=g" (eflags)
914 : "0" (op0), "m" (op1), "b" ((int)op2), "c" ((int)(op2 >> 32)));
915 printf("cmpxchg8b: op0=%016llx op1=%016llx CC=%02x\n",
916 op0, op1, eflags & CC_Z);
917 }
918 }
919 }
920
921 /**********************************************/
922 /* segmentation tests */
923
924 #include <asm/ldt.h>
925 #include <linux/unistd.h>
926 #include <linux/version.h>
927
928 _syscall3(int, modify_ldt, int, func, void *, ptr, unsigned long, bytecount)
929
930 #if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 5, 66)
931 #define modify_ldt_ldt_s user_desc
932 #endif
933
934 uint8_t seg_data1[4096];
935 uint8_t seg_data2[4096];
936
937 #define MK_SEL(n) (((n) << 3) | 7)
938
939 #define TEST_LR(op, size, seg, mask)\
940 {\
941 int res, res2;\
942 res = 0x12345678;\
943 asm (op " %" size "2, %" size "0\n" \
944 "movl $0, %1\n"\
945 "jnz 1f\n"\
946 "movl $1, %1\n"\
947 "1:\n"\
948 : "=r" (res), "=r" (res2) : "m" (seg), "0" (res));\
949 printf(op ": Z=%d %08x\n", res2, res & ~(mask));\
950 }
951
952 /* NOTE: we use Linux modify_ldt syscall */
953 void test_segs(void)
954 {
955 struct modify_ldt_ldt_s ldt;
956 long long ldt_table[3];
957 int res, res2;
958 char tmp;
959 struct {
960 uint32_t offset;
961 uint16_t seg;
962 } __attribute__((packed)) segoff;
963
964 ldt.entry_number = 1;
965 ldt.base_addr = (unsigned long)&seg_data1;
966 ldt.limit = (sizeof(seg_data1) + 0xfff) >> 12;
967 ldt.seg_32bit = 1;
968 ldt.contents = MODIFY_LDT_CONTENTS_DATA;
969 ldt.read_exec_only = 0;
970 ldt.limit_in_pages = 1;
971 ldt.seg_not_present = 0;
972 ldt.useable = 1;
973 modify_ldt(1, &ldt, sizeof(ldt)); /* write ldt entry */
974
975 ldt.entry_number = 2;
976 ldt.base_addr = (unsigned long)&seg_data2;
977 ldt.limit = (sizeof(seg_data2) + 0xfff) >> 12;
978 ldt.seg_32bit = 1;
979 ldt.contents = MODIFY_LDT_CONTENTS_DATA;
980 ldt.read_exec_only = 0;
981 ldt.limit_in_pages = 1;
982 ldt.seg_not_present = 0;
983 ldt.useable = 1;
984 modify_ldt(1, &ldt, sizeof(ldt)); /* write ldt entry */
985
986 modify_ldt(0, &ldt_table, sizeof(ldt_table)); /* read ldt entries */
987 #if 0
988 {
989 int i;
990 for(i=0;i<3;i++)
991 printf("%d: %016Lx\n", i, ldt_table[i]);
992 }
993 #endif
994 /* do some tests with fs or gs */
995 asm volatile ("movl %0, %%fs" : : "r" (MK_SEL(1)));
996
997 seg_data1[1] = 0xaa;
998 seg_data2[1] = 0x55;
999
1000 asm volatile ("fs movzbl 0x1, %0" : "=r" (res));
1001 printf("FS[1] = %02x\n", res);
1002
1003 asm volatile ("pushl %%gs\n"
1004 "movl %1, %%gs\n"
1005 "gs movzbl 0x1, %0\n"
1006 "popl %%gs\n"
1007 : "=r" (res)
1008 : "r" (MK_SEL(2)));
1009 printf("GS[1] = %02x\n", res);
1010
1011 /* tests with ds/ss (implicit segment case) */
1012 tmp = 0xa5;
1013 asm volatile ("pushl %%ebp\n\t"
1014 "pushl %%ds\n\t"
1015 "movl %2, %%ds\n\t"
1016 "movl %3, %%ebp\n\t"
1017 "movzbl 0x1, %0\n\t"
1018 "movzbl (%%ebp), %1\n\t"
1019 "popl %%ds\n\t"
1020 "popl %%ebp\n\t"
1021 : "=r" (res), "=r" (res2)
1022 : "r" (MK_SEL(1)), "r" (&tmp));
1023 printf("DS[1] = %02x\n", res);
1024 printf("SS[tmp] = %02x\n", res2);
1025
1026 segoff.seg = MK_SEL(2);
1027 segoff.offset = 0xabcdef12;
1028 asm volatile("lfs %2, %0\n\t"
1029 "movl %%fs, %1\n\t"
1030 : "=r" (res), "=g" (res2)
1031 : "m" (segoff));
1032 printf("FS:reg = %04x:%08x\n", res2, res);
1033
1034 TEST_LR("larw", "w", MK_SEL(2), 0x0100);
1035 TEST_LR("larl", "", MK_SEL(2), 0x0100);
1036 TEST_LR("lslw", "w", MK_SEL(2), 0);
1037 TEST_LR("lsll", "", MK_SEL(2), 0);
1038
1039 TEST_LR("larw", "w", 0xfff8, 0);
1040 TEST_LR("larl", "", 0xfff8, 0);
1041 TEST_LR("lslw", "w", 0xfff8, 0);
1042 TEST_LR("lsll", "", 0xfff8, 0);
1043 }
1044
1045 /* 16 bit code test */
1046 extern char code16_start, code16_end;
1047 extern char code16_func1;
1048 extern char code16_func2;
1049 extern char code16_func3;
1050
1051 void test_code16(void)
1052 {
1053 struct modify_ldt_ldt_s ldt;
1054 int res, res2;
1055
1056 /* build a code segment */
1057 ldt.entry_number = 1;
1058 ldt.base_addr = (unsigned long)&code16_start;
1059 ldt.limit = &code16_end - &code16_start;
1060 ldt.seg_32bit = 0;
1061 ldt.contents = MODIFY_LDT_CONTENTS_CODE;
1062 ldt.read_exec_only = 0;
1063 ldt.limit_in_pages = 0;
1064 ldt.seg_not_present = 0;
1065 ldt.useable = 1;
1066 modify_ldt(1, &ldt, sizeof(ldt)); /* write ldt entry */
1067
1068 /* call the first function */
1069 asm volatile ("lcall %1, %2"
1070 : "=a" (res)
1071 : "i" (MK_SEL(1)), "i" (&code16_func1): "memory", "cc");
1072 printf("func1() = 0x%08x\n", res);
1073 asm volatile ("lcall %2, %3"
1074 : "=a" (res), "=c" (res2)
1075 : "i" (MK_SEL(1)), "i" (&code16_func2): "memory", "cc");
1076 printf("func2() = 0x%08x spdec=%d\n", res, res2);
1077 asm volatile ("lcall %1, %2"
1078 : "=a" (res)
1079 : "i" (MK_SEL(1)), "i" (&code16_func3): "memory", "cc");
1080 printf("func3() = 0x%08x\n", res);
1081 }
1082
1083 extern char func_lret32;
1084 extern char func_iret32;
1085
1086 void test_misc(void)
1087 {
1088 char table[256];
1089 int res, i;
1090
1091 for(i=0;i<256;i++) table[i] = 256 - i;
1092 res = 0x12345678;
1093 asm ("xlat" : "=a" (res) : "b" (table), "0" (res));
1094 printf("xlat: EAX=%08x\n", res);
1095
1096 asm volatile ("pushl %%cs ; call %1"
1097 : "=a" (res)
1098 : "m" (func_lret32): "memory", "cc");
1099 printf("func_lret32=%x\n", res);
1100
1101 asm volatile ("pushfl ; pushl %%cs ; call %1"
1102 : "=a" (res)
1103 : "m" (func_iret32): "memory", "cc");
1104 printf("func_iret32=%x\n", res);
1105
1106 /* specific popl test */
1107 asm volatile ("pushl $12345432 ; pushl $0x9abcdef ; popl (%%esp) ; popl %0"
1108 : "=g" (res));
1109 printf("popl esp=%x\n", res);
1110
1111 /* specific popw test */
1112 asm volatile ("pushl $12345432 ; pushl $0x9abcdef ; popw (%%esp) ; addl $2, %%esp ; popl %0"
1113 : "=g" (res));
1114 printf("popw esp=%x\n", res);
1115 }
1116
1117 uint8_t str_buffer[4096];
1118
1119 #define TEST_STRING1(OP, size, DF, REP)\
1120 {\
1121 int esi, edi, eax, ecx, eflags;\
1122 \
1123 esi = (long)(str_buffer + sizeof(str_buffer) / 2);\
1124 edi = (long)(str_buffer + sizeof(str_buffer) / 2) + 16;\
1125 eax = 0x12345678;\
1126 ecx = 17;\
1127 \
1128 asm volatile ("pushl $0\n\t"\
1129 "popf\n\t"\
1130 DF "\n\t"\
1131 REP #OP size "\n\t"\
1132 "cld\n\t"\
1133 "pushf\n\t"\
1134 "popl %4\n\t"\
1135 : "=S" (esi), "=D" (edi), "=a" (eax), "=c" (ecx), "=g" (eflags)\
1136 : "0" (esi), "1" (edi), "2" (eax), "3" (ecx));\
1137 printf("%-10s ESI=%08x EDI=%08x EAX=%08x ECX=%08x EFL=%04x\n",\
1138 REP #OP size, esi, edi, eax, ecx,\
1139 eflags & (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A));\
1140 }
1141
1142 #define TEST_STRING(OP, REP)\
1143 TEST_STRING1(OP, "b", "", REP);\
1144 TEST_STRING1(OP, "w", "", REP);\
1145 TEST_STRING1(OP, "l", "", REP);\
1146 TEST_STRING1(OP, "b", "std", REP);\
1147 TEST_STRING1(OP, "w", "std", REP);\
1148 TEST_STRING1(OP, "l", "std", REP)
1149
1150 void test_string(void)
1151 {
1152 int i;
1153 for(i = 0;i < sizeof(str_buffer); i++)
1154 str_buffer[i] = i + 0x56;
1155 TEST_STRING(stos, "");
1156 TEST_STRING(stos, "rep ");
1157 TEST_STRING(lods, ""); /* to verify stos */
1158 TEST_STRING(lods, "rep ");
1159 TEST_STRING(movs, "");
1160 TEST_STRING(movs, "rep ");
1161 TEST_STRING(lods, ""); /* to verify stos */
1162
1163 /* XXX: better tests */
1164 TEST_STRING(scas, "");
1165 TEST_STRING(scas, "repz ");
1166 TEST_STRING(scas, "repnz ");
1167 TEST_STRING(cmps, "");
1168 TEST_STRING(cmps, "repz ");
1169 TEST_STRING(cmps, "repnz ");
1170 }
1171
1172 /* VM86 test */
1173
1174 static inline void set_bit(uint8_t *a, unsigned int bit)
1175 {
1176 a[bit / 8] |= (1 << (bit % 8));
1177 }
1178
1179 static inline uint8_t *seg_to_linear(unsigned int seg, unsigned int reg)
1180 {
1181 return (uint8_t *)((seg << 4) + (reg & 0xffff));
1182 }
1183
1184 static inline void pushw(struct vm86_regs *r, int val)
1185 {
1186 r->esp = (r->esp & ~0xffff) | ((r->esp - 2) & 0xffff);
1187 *(uint16_t *)seg_to_linear(r->ss, r->esp) = val;
1188 }
1189
1190 #undef __syscall_return
1191 #define __syscall_return(type, res) \
1192 do { \
1193 return (type) (res); \
1194 } while (0)
1195
1196 _syscall2(int, vm86, int, func, struct vm86plus_struct *, v86)
1197
1198 extern char vm86_code_start;
1199 extern char vm86_code_end;
1200
1201 #define VM86_CODE_CS 0x100
1202 #define VM86_CODE_IP 0x100
1203
1204 void test_vm86(void)
1205 {
1206 struct vm86plus_struct ctx;
1207 struct vm86_regs *r;
1208 uint8_t *vm86_mem;
1209 int seg, ret;
1210
1211 vm86_mem = mmap((void *)0x00000000, 0x110000,
1212 PROT_WRITE | PROT_READ | PROT_EXEC,
1213 MAP_FIXED | MAP_ANON | MAP_PRIVATE, -1, 0);
1214 if (vm86_mem == MAP_FAILED) {
1215 printf("ERROR: could not map vm86 memory");
1216 return;
1217 }
1218 memset(&ctx, 0, sizeof(ctx));
1219
1220 /* init basic registers */
1221 r = &ctx.regs;
1222 r->eip = VM86_CODE_IP;
1223 r->esp = 0xfffe;
1224 seg = VM86_CODE_CS;
1225 r->cs = seg;
1226 r->ss = seg;
1227 r->ds = seg;
1228 r->es = seg;
1229 r->fs = seg;
1230 r->gs = seg;
1231 r->eflags = VIF_MASK;
1232
1233 /* move code to proper address. We use the same layout as a .com
1234 dos program. */
1235 memcpy(vm86_mem + (VM86_CODE_CS << 4) + VM86_CODE_IP,
1236 &vm86_code_start, &vm86_code_end - &vm86_code_start);
1237
1238 /* mark int 0x21 as being emulated */
1239 set_bit((uint8_t *)&ctx.int_revectored, 0x21);
1240
1241 for(;;) {
1242 ret = vm86(VM86_ENTER, &ctx);
1243 switch(VM86_TYPE(ret)) {
1244 case VM86_INTx:
1245 {
1246 int int_num, ah, v;
1247
1248 int_num = VM86_ARG(ret);
1249 if (int_num != 0x21)
1250 goto unknown_int;
1251 ah = (r->eax >> 8) & 0xff;
1252 switch(ah) {
1253 case 0x00: /* exit */
1254 goto the_end;
1255 case 0x02: /* write char */
1256 {
1257 uint8_t c = r->edx;
1258 putchar(c);
1259 }
1260 break;
1261 case 0x09: /* write string */
1262 {
1263 uint8_t c, *ptr;
1264 ptr = seg_to_linear(r->ds, r->edx);
1265 for(;;) {
1266 c = *ptr++;
1267 if (c == '$')
1268 break;
1269 putchar(c);
1270 }
1271 r->eax = (r->eax & ~0xff) | '$';
1272 }
1273 break;
1274 case 0xff: /* extension: write eflags number in edx */
1275 v = (int)r->edx;
1276 #ifndef LINUX_VM86_IOPL_FIX
1277 v &= ~0x3000;
1278 #endif
1279 printf("%08x\n", v);
1280 break;
1281 default:
1282 unknown_int:
1283 printf("unsupported int 0x%02x\n", int_num);
1284 goto the_end;
1285 }
1286 }
1287 break;
1288 case VM86_SIGNAL:
1289 /* a signal came, we just ignore that */
1290 break;
1291 case VM86_STI:
1292 break;
1293 default:
1294 printf("ERROR: unhandled vm86 return code (0x%x)\n", ret);
1295 goto the_end;
1296 }
1297 }
1298 the_end:
1299 printf("VM86 end\n");
1300 munmap(vm86_mem, 0x110000);
1301 }
1302
1303 /* exception tests */
1304 #ifndef REG_EAX
1305 #define REG_EAX EAX
1306 #define REG_EBX EBX
1307 #define REG_ECX ECX
1308 #define REG_EDX EDX
1309 #define REG_ESI ESI
1310 #define REG_EDI EDI
1311 #define REG_EBP EBP
1312 #define REG_ESP ESP
1313 #define REG_EIP EIP
1314 #define REG_EFL EFL
1315 #define REG_TRAPNO TRAPNO
1316 #define REG_ERR ERR
1317 #endif
1318
1319 jmp_buf jmp_env;
1320 int v1;
1321 int tab[2];
1322
1323 void sig_handler(int sig, siginfo_t *info, void *puc)
1324 {
1325 struct ucontext *uc = puc;
1326
1327 printf("si_signo=%d si_errno=%d si_code=%d",
1328 info->si_signo, info->si_errno, info->si_code);
1329 printf(" si_addr=0x%08lx",
1330 (unsigned long)info->si_addr);
1331 printf("\n");
1332
1333 printf("trapno=0x%02x err=0x%08x",
1334 uc->uc_mcontext.gregs[REG_TRAPNO],
1335 uc->uc_mcontext.gregs[REG_ERR]);
1336 printf(" EIP=0x%08x", uc->uc_mcontext.gregs[REG_EIP]);
1337 printf("\n");
1338 longjmp(jmp_env, 1);
1339 }
1340
1341 void test_exceptions(void)
1342 {
1343 struct modify_ldt_ldt_s ldt;
1344 struct sigaction act;
1345 volatile int val;
1346
1347 act.sa_sigaction = sig_handler;
1348 sigemptyset(&act.sa_mask);
1349 act.sa_flags = SA_SIGINFO;
1350 sigaction(SIGFPE, &act, NULL);
1351 sigaction(SIGILL, &act, NULL);
1352 sigaction(SIGSEGV, &act, NULL);
1353 sigaction(SIGBUS, &act, NULL);
1354 sigaction(SIGTRAP, &act, NULL);
1355
1356 /* test division by zero reporting */
1357 printf("DIVZ exception:\n");
1358 if (setjmp(jmp_env) == 0) {
1359 /* now divide by zero */
1360 v1 = 0;
1361 v1 = 2 / v1;
1362 }
1363
1364 printf("BOUND exception:\n");
1365 if (setjmp(jmp_env) == 0) {
1366 /* bound exception */
1367 tab[0] = 1;
1368 tab[1] = 10;
1369 asm volatile ("bound %0, %1" : : "r" (11), "m" (tab[0]));
1370 }
1371
1372 printf("segment exceptions:\n");
1373 if (setjmp(jmp_env) == 0) {
1374 /* load an invalid segment */
1375 asm volatile ("movl %0, %%fs" : : "r" ((0x1234 << 3) | 1));
1376 }
1377 if (setjmp(jmp_env) == 0) {
1378 /* null data segment is valid */
1379 asm volatile ("movl %0, %%fs" : : "r" (3));
1380 /* null stack segment */
1381 asm volatile ("movl %0, %%ss" : : "r" (3));
1382 }
1383
1384 ldt.entry_number = 1;
1385 ldt.base_addr = (unsigned long)&seg_data1;
1386 ldt.limit = (sizeof(seg_data1) + 0xfff) >> 12;
1387 ldt.seg_32bit = 1;
1388 ldt.contents = MODIFY_LDT_CONTENTS_DATA;
1389 ldt.read_exec_only = 0;
1390 ldt.limit_in_pages = 1;
1391 ldt.seg_not_present = 1;
1392 ldt.useable = 1;
1393 modify_ldt(1, &ldt, sizeof(ldt)); /* write ldt entry */
1394
1395 if (setjmp(jmp_env) == 0) {
1396 /* segment not present */
1397 asm volatile ("movl %0, %%fs" : : "r" (MK_SEL(1)));
1398 }
1399
1400 /* test SEGV reporting */
1401 printf("PF exception:\n");
1402 if (setjmp(jmp_env) == 0) {
1403 val = 1;
1404 /* we add a nop to test a weird PC retrieval case */
1405 asm volatile ("nop");
1406 /* now store in an invalid address */
1407 *(char *)0x1234 = 1;
1408 }
1409
1410 /* test SEGV reporting */
1411 printf("PF exception:\n");
1412 if (setjmp(jmp_env) == 0) {
1413 val = 1;
1414 /* read from an invalid address */
1415 v1 = *(char *)0x1234;
1416 }
1417
1418 /* test illegal instruction reporting */
1419 printf("UD2 exception:\n");
1420 if (setjmp(jmp_env) == 0) {
1421 /* now execute an invalid instruction */
1422 asm volatile("ud2");
1423 }
1424 printf("lock nop exception:\n");
1425 if (setjmp(jmp_env) == 0) {
1426 /* now execute an invalid instruction */
1427 asm volatile("lock nop");
1428 }
1429
1430 printf("INT exception:\n");
1431 if (setjmp(jmp_env) == 0) {
1432 asm volatile ("int $0xfd");
1433 }
1434 if (setjmp(jmp_env) == 0) {
1435 asm volatile ("int $0x01");
1436 }
1437 if (setjmp(jmp_env) == 0) {
1438 asm volatile (".byte 0xcd, 0x03");
1439 }
1440 if (setjmp(jmp_env) == 0) {
1441 asm volatile ("int $0x04");
1442 }
1443 if (setjmp(jmp_env) == 0) {
1444 asm volatile ("int $0x05");
1445 }
1446
1447 printf("INT3 exception:\n");
1448 if (setjmp(jmp_env) == 0) {
1449 asm volatile ("int3");
1450 }
1451
1452 printf("CLI exception:\n");
1453 if (setjmp(jmp_env) == 0) {
1454 asm volatile ("cli");
1455 }
1456
1457 printf("STI exception:\n");
1458 if (setjmp(jmp_env) == 0) {
1459 asm volatile ("cli");
1460 }
1461
1462 printf("INTO exception:\n");
1463 if (setjmp(jmp_env) == 0) {
1464 /* overflow exception */
1465 asm volatile ("addl $1, %0 ; into" : : "r" (0x7fffffff));
1466 }
1467
1468 printf("OUTB exception:\n");
1469 if (setjmp(jmp_env) == 0) {
1470 asm volatile ("outb %%al, %%dx" : : "d" (0x4321), "a" (0));
1471 }
1472
1473 printf("INB exception:\n");
1474 if (setjmp(jmp_env) == 0) {
1475 asm volatile ("inb %%dx, %%al" : "=a" (val) : "d" (0x4321));
1476 }
1477
1478 printf("REP OUTSB exception:\n");
1479 if (setjmp(jmp_env) == 0) {
1480 asm volatile ("rep outsb" : : "d" (0x4321), "S" (tab), "c" (1));
1481 }
1482
1483 printf("REP INSB exception:\n");
1484 if (setjmp(jmp_env) == 0) {
1485 asm volatile ("rep insb" : : "d" (0x4321), "D" (tab), "c" (1));
1486 }
1487
1488 printf("HLT exception:\n");
1489 if (setjmp(jmp_env) == 0) {
1490 asm volatile ("hlt");
1491 }
1492
1493 printf("single step exception:\n");
1494 val = 0;
1495 if (setjmp(jmp_env) == 0) {
1496 asm volatile ("pushf\n"
1497 "orl $0x00100, (%%esp)\n"
1498 "popf\n"
1499 "movl $0xabcd, %0\n"
1500 "movl $0x0, %0\n" : "=m" (val) : : "cc", "memory");
1501 }
1502 printf("val=0x%x\n", val);
1503 }
1504
1505 /* specific precise single step test */
1506 void sig_trap_handler(int sig, siginfo_t *info, void *puc)
1507 {
1508 struct ucontext *uc = puc;
1509 printf("EIP=0x%08x\n", uc->uc_mcontext.gregs[REG_EIP]);
1510 }
1511
1512 const uint8_t sstep_buf1[4] = { 1, 2, 3, 4};
1513 uint8_t sstep_buf2[4];
1514
1515 void test_single_step(void)
1516 {
1517 struct sigaction act;
1518 volatile int val;
1519 int i;
1520
1521 val = 0;
1522 act.sa_sigaction = sig_trap_handler;
1523 sigemptyset(&act.sa_mask);
1524 act.sa_flags = SA_SIGINFO;
1525 sigaction(SIGTRAP, &act, NULL);
1526 asm volatile ("pushf\n"
1527 "orl $0x00100, (%%esp)\n"
1528 "popf\n"
1529 "movl $0xabcd, %0\n"
1530
1531 /* jmp test */
1532 "movl $3, %%ecx\n"
1533 "1:\n"
1534 "addl $1, %0\n"
1535 "decl %%ecx\n"
1536 "jnz 1b\n"
1537
1538 /* movsb: the single step should stop at each movsb iteration */
1539 "movl $sstep_buf1, %%esi\n"
1540 "movl $sstep_buf2, %%edi\n"
1541 "movl $0, %%ecx\n"
1542 "rep movsb\n"
1543 "movl $3, %%ecx\n"
1544 "rep movsb\n"
1545 "movl $1, %%ecx\n"
1546 "rep movsb\n"
1547
1548 /* cmpsb: the single step should stop at each cmpsb iteration */
1549 "movl $sstep_buf1, %%esi\n"
1550 "movl $sstep_buf2, %%edi\n"
1551 "movl $0, %%ecx\n"
1552 "rep cmpsb\n"
1553 "movl $4, %%ecx\n"
1554 "rep cmpsb\n"
1555
1556 /* getpid() syscall: single step should skip one
1557 instruction */
1558 "movl $20, %%eax\n"
1559 "int $0x80\n"
1560 "movl $0, %%eax\n"
1561
1562 /* when modifying SS, trace is not done on the next
1563 instruction */
1564 "movl %%ss, %%ecx\n"
1565 "movl %%ecx, %%ss\n"
1566 "addl $1, %0\n"
1567 "movl $1, %%eax\n"
1568 "movl %%ecx, %%ss\n"
1569 "jmp 1f\n"
1570 "addl $1, %0\n"
1571 "1:\n"
1572 "movl $1, %%eax\n"
1573 "pushl %%ecx\n"
1574 "popl %%ss\n"
1575 "addl $1, %0\n"
1576 "movl $1, %%eax\n"
1577
1578 "pushf\n"
1579 "andl $~0x00100, (%%esp)\n"
1580 "popf\n"
1581 : "=m" (val)
1582 :
1583 : "cc", "memory", "eax", "ecx", "esi", "edi");
1584 printf("val=%d\n", val);
1585 for(i = 0; i < 4; i++)
1586 printf("sstep_buf2[%d] = %d\n", i, sstep_buf2[i]);
1587 }
1588
1589 /* self modifying code test */
1590 uint8_t code[] = {
1591 0xb8, 0x1, 0x00, 0x00, 0x00, /* movl $1, %eax */
1592 0xc3, /* ret */
1593 };
1594
1595 asm("smc_code2:\n"
1596 "movl 4(%esp), %eax\n"
1597 "movl %eax, smc_patch_addr2 + 1\n"
1598 "nop\n"
1599 "nop\n"
1600 "nop\n"
1601 "nop\n"
1602 "nop\n"
1603 "nop\n"
1604 "nop\n"
1605 "nop\n"
1606 "smc_patch_addr2:\n"
1607 "movl $1, %eax\n"
1608 "ret\n");
1609
1610 typedef int FuncType(void);
1611 extern int smc_code2(int);
1612 void test_self_modifying_code(void)
1613 {
1614 int i;
1615
1616 printf("self modifying code:\n");
1617 printf("func1 = 0x%x\n", ((FuncType *)code)());
1618 for(i = 2; i <= 4; i++) {
1619 code[1] = i;
1620 printf("func%d = 0x%x\n", i, ((FuncType *)code)());
1621 }
1622
1623 /* more difficult test : the modified code is just after the
1624 modifying instruction. It is forbidden in Intel specs, but it
1625 is used by old DOS programs */
1626 for(i = 2; i <= 4; i++) {
1627 printf("smc_code2(%d) = %d\n", i, smc_code2(i));
1628 }
1629 }
1630
1631 int enter_stack[4096];
1632
1633 #define TEST_ENTER(size, stack_type, level)\
1634 {\
1635 int esp_save, esp_val, ebp_val, ebp_save, i;\
1636 stack_type *ptr, *stack_end, *stack_ptr;\
1637 memset(enter_stack, 0, sizeof(enter_stack));\
1638 stack_end = stack_ptr = (stack_type *)(enter_stack + 4096);\
1639 ebp_val = (long)stack_ptr;\
1640 for(i=1;i<=32;i++)\
1641 *--stack_ptr = i;\
1642 esp_val = (long)stack_ptr;\
1643 asm("movl %%esp, %[esp_save]\n"\
1644 "movl %%ebp, %[ebp_save]\n"\
1645 "movl %[esp_val], %%esp\n"\
1646 "movl %[ebp_val], %%ebp\n"\
1647 "enter" size " $12, $" #level "\n"\
1648 "movl %%esp, %[esp_val]\n"\
1649 "movl %%ebp, %[ebp_val]\n"\
1650 "movl %[esp_save], %%esp\n"\
1651 "movl %[ebp_save], %%ebp\n"\
1652 : [esp_save] "=r" (esp_save),\
1653 [ebp_save] "=r" (ebp_save),\
1654 [esp_val] "=r" (esp_val),\
1655 [ebp_val] "=r" (ebp_val)\
1656 : "[esp_val]" (esp_val),\
1657 "[ebp_val]" (ebp_val));\
1658 printf("level=%d:\n", level);\
1659 printf("esp_val=0x%08lx\n", esp_val - (long)stack_end);\
1660 printf("ebp_val=0x%08lx\n", ebp_val - (long)stack_end);\
1661 for(ptr = (stack_type *)esp_val; ptr < stack_end; ptr++)\
1662 printf("%08x\n", ptr[0]);\
1663 }
1664
1665 static void test_enter(void)
1666 {
1667 TEST_ENTER("l", uint32_t, 0);
1668 TEST_ENTER("l", uint32_t, 1);
1669 TEST_ENTER("l", uint32_t, 2);
1670 TEST_ENTER("l", uint32_t, 31);
1671
1672 TEST_ENTER("w", uint16_t, 0);
1673 TEST_ENTER("w", uint16_t, 1);
1674 TEST_ENTER("w", uint16_t, 2);
1675 TEST_ENTER("w", uint16_t, 31);
1676 }
1677
1678 #ifdef TEST_SSE
1679
1680 typedef int __m64 __attribute__ ((__mode__ (__V2SI__)));
1681 typedef int __m128 __attribute__ ((__mode__(__V4SF__)));
1682
1683 typedef union {
1684 double d[2];
1685 float s[4];
1686 uint32_t l[4];
1687 uint64_t q[2];
1688 __m128 dq;
1689 } XMMReg;
1690
1691 static uint64_t __attribute__((aligned(16))) test_values[4][2] = {
1692 { 0x456723c698694873, 0xdc515cff944a58ec },
1693 { 0x1f297ccd58bad7ab, 0x41f21efba9e3e146 },
1694 { 0x007c62c2085427f8, 0x231be9e8cde7438d },
1695 { 0x0f76255a085427f8, 0xc233e9e8c4c9439a },
1696 };
1697
1698 #define SSE_OP(op)\
1699 {\
1700 asm volatile (#op " %2, %0" : "=x" (r.dq) : "0" (a.dq), "x" (b.dq));\
1701 printf("%-9s: a=%016llx%016llx b=%016llx%016llx r=%016llx%016llx\n",\
1702 #op,\
1703 a.q[1], a.q[0],\
1704 b.q[1], b.q[0],\
1705 r.q[1], r.q[0]);\
1706 }
1707
1708 #define SSE_OP2(op)\
1709 {\
1710 int i;\
1711 for(i=0;i<2;i++) {\
1712 a.q[0] = test_values[2*i][0];\
1713 a.q[1] = test_values[2*i][1];\
1714 b.q[0] = test_values[2*i+1][0];\
1715 b.q[1] = test_values[2*i+1][1];\
1716 SSE_OP(op);\
1717 }\
1718 }
1719
1720 #define MMX_OP2(op)\
1721 {\
1722 int i;\
1723 for(i=0;i<2;i++) {\
1724 a.q[0] = test_values[2*i][0];\
1725 b.q[0] = test_values[2*i+1][0];\
1726 asm volatile (#op " %2, %0" : "=y" (r.q[0]) : "0" (a.q[0]), "y" (b.q[0]));\
1727 printf("%-9s: a=%016llx b=%016llx r=%016llx\n",\
1728 #op,\
1729 a.q[0],\
1730 b.q[0],\
1731 r.q[0]);\
1732 }\
1733 SSE_OP2(op);\
1734 }
1735
1736 #define SHUF_OP(op, ib)\
1737 {\
1738 a.q[0] = test_values[0][0];\
1739 a.q[1] = test_values[0][1];\
1740 b.q[0] = test_values[1][0];\
1741 b.q[1] = test_values[1][1];\
1742 asm volatile (#op " $" #ib ", %2, %0" : "=x" (r.dq) : "0" (a.dq), "x" (b.dq));\
1743 printf("%-9s: a=%016llx%016llx b=%016llx%016llx ib=%02x r=%016llx%016llx\n",\
1744 #op,\
1745 a.q[1], a.q[0],\
1746 b.q[1], b.q[0],\
1747 ib,\
1748 r.q[1], r.q[0]);\
1749 }
1750
1751 #define PSHUF_OP(op, ib)\
1752 {\
1753 int i;\
1754 for(i=0;i<2;i++) {\
1755 a.q[0] = test_values[2*i][0];\
1756 a.q[1] = test_values[2*i][1];\
1757 asm volatile (#op " $" #ib ", %1, %0" : "=x" (r.dq) : "x" (a.dq));\
1758 printf("%-9s: a=%016llx%016llx ib=%02x r=%016llx%016llx\n",\
1759 #op,\
1760 a.q[1], a.q[0],\
1761 ib,\
1762 r.q[1], r.q[0]);\
1763 }\
1764 }
1765
1766 #define SHIFT_IM(op, ib)\
1767 {\
1768 int i;\
1769 for(i=0;i<2;i++) {\
1770 a.q[0] = test_values[2*i][0];\
1771 a.q[1] = test_values[2*i][1];\
1772 asm volatile (#op " $" #ib ", %0" : "=x" (r.dq) : "0" (a.dq));\
1773 printf("%-9s: a=%016llx%016llx ib=%02x r=%016llx%016llx\n",\
1774 #op,\
1775 a.q[1], a.q[0],\
1776 ib,\
1777 r.q[1], r.q[0]);\
1778 }\
1779 }
1780
1781 #define SHIFT_OP(op, ib)\
1782 {\
1783 int i;\
1784 SHIFT_IM(op, ib);\
1785 for(i=0;i<2;i++) {\
1786 a.q[0] = test_values[2*i][0];\
1787 a.q[1] = test_values[2*i][1];\
1788 b.q[0] = ib;\
1789 b.q[1] = 0;\
1790 asm volatile (#op " %2, %0" : "=x" (r.dq) : "0" (a.dq), "x" (b.dq));\
1791 printf("%-9s: a=%016llx%016llx b=%016llx%016llx r=%016llx%016llx\n",\
1792 #op,\
1793 a.q[1], a.q[0],\
1794 b.q[1], b.q[0],\
1795 r.q[1], r.q[0]);\
1796 }\
1797 }
1798
1799 #define MOVMSK(op)\
1800 {\
1801 int i, reg;\
1802 for(i=0;i<2;i++) {\
1803 a.q[0] = test_values[2*i][0];\
1804 a.q[1] = test_values[2*i][1];\
1805 asm volatile (#op " %1, %0" : "=r" (reg) : "x" (a.dq));\
1806 printf("%-9s: a=%016llx%016llx r=%08x\n",\
1807 #op,\
1808 a.q[1], a.q[0],\
1809 reg);\
1810 }\
1811 }
1812
1813 #define SSE_OPS(a) \
1814 SSE_OP(a ## ps);\
1815 SSE_OP(a ## ss);
1816
1817 #define SSE_OPD(a) \
1818 SSE_OP(a ## pd);\
1819 SSE_OP(a ## sd);
1820
1821 #define SSE_COMI(op, field)\
1822 {\
1823 unsigned int eflags;\
1824 XMMReg a, b;\
1825 a.field[0] = a1;\
1826 b.field[0] = b1;\
1827 asm volatile (#op " %2, %1\n"\
1828 "pushf\n"\
1829 "pop %0\n"\
1830 : "=m" (eflags)\
1831 : "x" (a.dq), "x" (b.dq));\
1832 printf("%-9s: a=%f b=%f cc=%04x\n",\
1833 #op, a1, b1,\
1834 eflags & (CC_C | CC_P | CC_Z | CC_S | CC_O | CC_A));\
1835 }
1836
1837 void test_sse_comi(double a1, double b1)
1838 {
1839 SSE_COMI(ucomiss, s);
1840 SSE_COMI(ucomisd, d);
1841 SSE_COMI(comiss, s);
1842 SSE_COMI(comisd, d);
1843 }
1844
1845 #define CVT_OP_XMM(op)\
1846 {\
1847 asm volatile (#op " %1, %0" : "=x" (r.dq) : "x" (a.dq));\
1848 printf("%-9s: a=%016llx%016llx r=%016llx%016llx\n",\
1849 #op,\
1850 a.q[1], a.q[0],\
1851 r.q[1], r.q[0]);\
1852 }
1853
1854 #define CVT_OP_XMM2MMX(op)\
1855 {\
1856 asm volatile (#op " %1, %0" : "=y" (r.q[0]) : "x" (a.dq));\
1857 printf("%-9s: a=%016llx%016llx r=%016llx\n",\
1858 #op,\
1859 a.q[1], a.q[0],\
1860 r.q[0]);\
1861 }
1862
1863 #define CVT_OP_MMX2XMM(op)\
1864 {\
1865 asm volatile (#op " %1, %0" : "=x" (r.dq) : "y" (a.q[0]));\
1866 printf("%-9s: a=%016llx r=%016llx%016llx\n",\
1867 #op,\
1868 a.q[0],\
1869 r.q[1], r.q[0]);\
1870 }
1871
1872 #define CVT_OP_REG2XMM(op)\
1873 {\
1874 asm volatile (#op " %1, %0" : "=x" (r.dq) : "r" (a.l[0]));\
1875 printf("%-9s: a=%08x r=%016llx%016llx\n",\
1876 #op,\
1877 a.l[0],\
1878 r.q[1], r.q[0]);\
1879 }
1880
1881 #define CVT_OP_XMM2REG(op)\
1882 {\
1883 asm volatile (#op " %1, %0" : "=r" (r.l[0]) : "x" (a.dq));\
1884 printf("%-9s: a=%016llx%016llx r=%08x\n",\
1885 #op,\
1886 a.q[1], a.q[0],\
1887 r.l[0]);\
1888 }
1889
1890 struct fpxstate {
1891 uint16_t fpuc;
1892 uint16_t fpus;
1893 uint16_t fptag;
1894 uint16_t fop;
1895 uint32_t fpuip;
1896 uint16_t cs_sel;
1897 uint16_t dummy0;
1898 uint32_t fpudp;
1899 uint16_t ds_sel;
1900 uint16_t dummy1;
1901 uint32_t mxcsr;
1902 uint32_t mxcsr_mask;
1903 uint8_t fpregs1[8 * 16];
1904 uint8_t xmm_regs[8 * 16];
1905 uint8_t dummy2[224];
1906 };
1907
1908 static struct fpxstate fpx_state __attribute__((aligned(16)));
1909 static struct fpxstate fpx_state2 __attribute__((aligned(16)));
1910
1911 void test_fxsave(void)
1912 {
1913 struct fpxstate *fp = &fpx_state;
1914 struct fpxstate *fp2 = &fpx_state2;
1915 int i;
1916 XMMReg a, b;
1917 a.q[0] = test_values[0][0];
1918 a.q[1] = test_values[0][1];
1919 b.q[0] = test_values[1][0];
1920 b.q[1] = test_values[1][1];
1921
1922 asm("movdqa %2, %%xmm0\n"
1923 "movdqa %3, %%xmm7\n"
1924 " fld1\n"
1925 " fldpi\n"
1926 " fldln2\n"
1927 " fxsave %0\n"
1928 " fxrstor %0\n"
1929 " fxsave %1\n"
1930 " fninit\n"
1931 : "=m" (*(uint32_t *)fp2), "=m" (*(uint32_t *)fp)
1932 : "m" (a), "m" (b));
1933 printf("fpuc=%04x\n", fp->fpuc);
1934 printf("fpus=%04x\n", fp->fpus);
1935 printf("fptag=%04x\n", fp->fptag);
1936 for(i = 0; i < 3; i++) {
1937 printf("ST%d: %016llx %04x\n",
1938 i,
1939 *(uint64_t *)&fp->fpregs1[i * 16],
1940 *(uint16_t *)&fp->fpregs1[i * 16 + 8]);
1941 }
1942 printf("mxcsr=%08x\n", fp->mxcsr & 0x1f80);
1943 for(i = 0; i < 8; i++) {
1944 printf("xmm%d: %016llx%016llx\n",
1945 i,
1946 *(uint64_t *)&fp->xmm_regs[i * 16],
1947 *(uint64_t *)&fp->xmm_regs[i * 16 + 8]);
1948 }
1949 }
1950
1951 void test_sse(void)
1952 {
1953 XMMReg r, a, b;
1954
1955 MMX_OP2(punpcklbw);
1956 MMX_OP2(punpcklwd);
1957 MMX_OP2(punpckldq);
1958 MMX_OP2(packsswb);
1959 MMX_OP2(pcmpgtb);
1960 MMX_OP2(pcmpgtw);
1961 MMX_OP2(pcmpgtd);
1962 MMX_OP2(packuswb);
1963 MMX_OP2(punpckhbw);
1964 MMX_OP2(punpckhwd);
1965 MMX_OP2(punpckhdq);
1966 MMX_OP2(packssdw);
1967 MMX_OP2(pcmpeqb);
1968 MMX_OP2(pcmpeqw);
1969 MMX_OP2(pcmpeqd);
1970
1971 MMX_OP2(paddq);
1972 MMX_OP2(pmullw);
1973 MMX_OP2(psubusb);
1974 MMX_OP2(psubusw);
1975 MMX_OP2(pminub);
1976 MMX_OP2(pand);
1977 MMX_OP2(paddusb);
1978 MMX_OP2(paddusw);
1979 MMX_OP2(pmaxub);
1980 MMX_OP2(pandn);
1981
1982 MMX_OP2(pmulhuw);
1983 MMX_OP2(pmulhw);
1984
1985 MMX_OP2(psubsb);
1986 MMX_OP2(psubsw);
1987 MMX_OP2(pminsw);
1988 MMX_OP2(por);
1989 MMX_OP2(paddsb);
1990 MMX_OP2(paddsw);
1991 MMX_OP2(pmaxsw);
1992 MMX_OP2(pxor);
1993 MMX_OP2(pmuludq);
1994 MMX_OP2(pmaddwd);
1995 MMX_OP2(psadbw);
1996 MMX_OP2(psubb);
1997 MMX_OP2(psubw);
1998 MMX_OP2(psubd);
1999 MMX_OP2(psubq);
2000 MMX_OP2(paddb);
2001 MMX_OP2(paddw);
2002 MMX_OP2(paddd);
2003
2004 MMX_OP2(pavgb);
2005 MMX_OP2(pavgw);
2006
2007 asm volatile ("pinsrw $1, %1, %0" : "=y" (r.q[0]) : "r" (0x12345678));
2008 printf("%-9s: r=%016llx\n", "pinsrw", r.q[0]);
2009
2010 asm volatile ("pinsrw $5, %1, %0" : "=x" (r.dq) : "r" (0x12345678));
2011 printf("%-9s: r=%016llx%016llx\n", "pinsrw", r.q[1], r.q[0]);
2012
2013 a.q[0] = test_values[0][0];
2014 a.q[1] = test_values[0][1];
2015 asm volatile ("pextrw $1, %1, %0" : "=r" (r.l[0]) : "y" (a.q[0]));
2016 printf("%-9s: r=%08x\n", "pextrw", r.l[0]);
2017
2018 asm volatile ("pextrw $5, %1, %0" : "=r" (r.l[0]) : "x" (a.dq));
2019 printf("%-9s: r=%08x\n", "pextrw", r.l[0]);
2020
2021 asm volatile ("pmovmskb %1, %0" : "=r" (r.l[0]) : "y" (a.q[0]));
2022 printf("%-9s: r=%08x\n", "pmovmskb", r.l[0]);
2023
2024 asm volatile ("pmovmskb %1, %0" : "=r" (r.l[0]) : "x" (a.dq));
2025 printf("%-9s: r=%08x\n", "pmovmskb", r.l[0]);
2026
2027 {
2028 r.q[0] = -1;
2029 r.q[1] = -1;
2030
2031 a.q[0] = test_values[0][0];
2032 a.q[1] = test_values[0][1];
2033 b.q[0] = test_values[1][0];
2034 b.q[1] = test_values[1][1];
2035 asm volatile("maskmovq %1, %0" :
2036 : "y" (a.q[0]), "y" (b.q[0]), "D" (&r)
2037 : "memory");
2038 printf("%-9s: r=%016llx a=%016llx b=%016llx\n",
2039 "maskmov",
2040 r.q[0],
2041 a.q[0],
2042 b.q[0]);
2043 asm volatile("maskmovdqu %1, %0" :
2044 : "x" (a.dq), "x" (b.dq), "D" (&r)
2045 : "memory");
2046 printf("%-9s: r=%016llx%016llx a=%016llx%016llx b=%016llx%016llx\n",
2047 "maskmov",
2048 r.q[1], r.q[0],
2049 a.q[1], a.q[0],
2050 b.q[1], b.q[0]);
2051 }
2052
2053 asm volatile ("emms");
2054
2055 SSE_OP2(punpcklqdq);
2056 SSE_OP2(punpckhqdq);
2057 SSE_OP2(andps);
2058 SSE_OP2(andpd);
2059 SSE_OP2(andnps);
2060 SSE_OP2(andnpd);
2061 SSE_OP2(orps);
2062 SSE_OP2(orpd);
2063 SSE_OP2(xorps);
2064 SSE_OP2(xorpd);
2065
2066 SSE_OP2(unpcklps);
2067 SSE_OP2(unpcklpd);
2068 SSE_OP2(unpckhps);
2069 SSE_OP2(unpckhpd);
2070
2071 SHUF_OP(shufps, 0x78);
2072 SHUF_OP(shufpd, 0x02);
2073
2074 PSHUF_OP(pshufd, 0x78);
2075 PSHUF_OP(pshuflw, 0x78);
2076 PSHUF_OP(pshufhw, 0x78);
2077
2078 SHIFT_OP(psrlw, 7);
2079 SHIFT_OP(psrlw, 16);
2080 SHIFT_OP(psraw, 7);
2081 SHIFT_OP(psraw, 16);
2082 SHIFT_OP(psllw, 7);
2083 SHIFT_OP(psllw, 16);
2084
2085 SHIFT_OP(psrld, 7);
2086 SHIFT_OP(psrld, 32);
2087 SHIFT_OP(psrad, 7);
2088 SHIFT_OP(psrad, 32);
2089 SHIFT_OP(pslld, 7);
2090 SHIFT_OP(pslld, 32);
2091
2092 SHIFT_OP(psrlq, 7);
2093 SHIFT_OP(psrlq, 32);
2094 SHIFT_OP(psllq, 7);
2095 SHIFT_OP(psllq, 32);
2096
2097 SHIFT_IM(psrldq, 16);
2098 SHIFT_IM(psrldq, 7);
2099 SHIFT_IM(pslldq, 16);
2100 SHIFT_IM(pslldq, 7);
2101
2102 MOVMSK(movmskps);
2103 MOVMSK(movmskpd);
2104
2105 /* FPU specific ops */
2106
2107 {
2108 uint32_t mxcsr;
2109 asm volatile("stmxcsr %0" : "=m" (mxcsr));
2110 printf("mxcsr=%08x\n", mxcsr & 0x1f80);
2111 asm volatile("ldmxcsr %0" : : "m" (mxcsr));
2112 }
2113
2114 test_sse_comi(2, -1);
2115 test_sse_comi(2, 2);
2116 test_sse_comi(2, 3);
2117
2118 a.s[0] = 2.7;
2119 a.s[1] = 3.4;
2120 a.s[2] = 4;
2121 a.s[3] = -6.3;
2122 b.s[0] = 45.7;
2123 b.s[1] = 353.4;
2124 b.s[2] = 4;
2125 b.s[3] = 56.3;
2126 SSE_OPS(add);
2127 SSE_OPS(mul);
2128 SSE_OPS(sub);
2129 SSE_OPS(min);
2130 SSE_OPS(div);
2131 SSE_OPS(max);
2132 SSE_OPS(sqrt);
2133 SSE_OPS(cmpeq);
2134 SSE_OPS(cmplt);
2135 SSE_OPS(cmple);
2136 SSE_OPS(cmpunord);
2137 SSE_OPS(cmpneq);
2138 SSE_OPS(cmpnlt);
2139 SSE_OPS(cmpnle);
2140 SSE_OPS(cmpord);
2141
2142 a.d[0] = 2.7;
2143 a.d[1] = -3.4;
2144 b.d[0] = 45.7;
2145 b.d[1] = -53.4;
2146 SSE_OPD(add);
2147 SSE_OPD(mul);
2148 SSE_OPD(sub);
2149 SSE_OPD(min);
2150 SSE_OPD(div);
2151 SSE_OPD(max);
2152 SSE_OPD(sqrt);
2153 SSE_OPD(cmpeq);
2154 SSE_OPD(cmplt);
2155 SSE_OPD(cmple);
2156 SSE_OPD(cmpunord);
2157 SSE_OPD(cmpneq);
2158 SSE_OPD(cmpnlt);
2159 SSE_OPD(cmpnle);
2160 SSE_OPD(cmpord);
2161
2162 /* float to float/int */
2163 a.s[0] = 2.7;
2164 a.s[1] = 3.4;
2165 a.s[2] = 4;
2166 a.s[3] = -6.3;
2167 CVT_OP_XMM(cvtps2pd);
2168 CVT_OP_XMM(cvtss2sd);
2169 CVT_OP_XMM2MMX(cvtps2pi);
2170 CVT_OP_XMM2MMX(cvttps2pi);
2171 CVT_OP_XMM2REG(cvtss2si);
2172 CVT_OP_XMM2REG(cvttss2si);
2173 CVT_OP_XMM(cvtps2dq);
2174 CVT_OP_XMM(cvttps2dq);
2175
2176 a.d[0] = 2.6;
2177 a.d[1] = -3.4;
2178 CVT_OP_XMM(cvtpd2ps);
2179 CVT_OP_XMM(cvtsd2ss);
2180 CVT_OP_XMM2MMX(cvtpd2pi);
2181 CVT_OP_XMM2MMX(cvttpd2pi);
2182 CVT_OP_XMM2REG(cvtsd2si);
2183 CVT_OP_XMM2REG(cvttsd2si);
2184 CVT_OP_XMM(cvtpd2dq);
2185 CVT_OP_XMM(cvttpd2dq);
2186
2187 /* int to float */
2188 a.l[0] = -6;
2189 a.l[1] = 2;
2190 a.l[2] = 100;
2191 a.l[3] = -60000;
2192 CVT_OP_MMX2XMM(cvtpi2ps);
2193 CVT_OP_MMX2XMM(cvtpi2pd);
2194 CVT_OP_REG2XMM(cvtsi2ss);
2195 CVT_OP_REG2XMM(cvtsi2sd);
2196 CVT_OP_XMM(cvtdq2ps);
2197 CVT_OP_XMM(cvtdq2pd);
2198
2199 /* XXX: test PNI insns */
2200 #if 0
2201 SSE_OP2(movshdup);
2202 #endif
2203 asm volatile ("emms");
2204 }
2205
2206 #endif
2207
2208 static void *call_end __init_call = NULL;
2209
2210 int main(int argc, char **argv)
2211 {
2212 void **ptr;
2213 void (*func)(void);
2214
2215 ptr = &call_start + 1;
2216 while (*ptr != NULL) {
2217 func = *ptr++;
2218 func();
2219 }
2220 test_bsx();
2221 test_mul();
2222 test_jcc();
2223 test_floats();
2224 test_bcd();
2225 test_xchg();
2226 test_string();
2227 test_misc();
2228 test_lea();
2229 test_segs();
2230 test_code16();
2231 #ifdef TEST_VM86
2232 test_vm86();
2233 #endif
2234 test_exceptions();
2235 test_self_modifying_code();
2236 test_single_step();
2237 test_enter();
2238 #ifdef TEST_SSE
2239 test_sse();
2240 test_fxsave();
2241 #endif
2242 return 0;
2243 }