mirror of
https://github.com/ioacademy-jikim/debugging
synced 2025-06-08 16:36:21 +00:00
219 lines
6.5 KiB
C
219 lines
6.5 KiB
C
#include <config.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include "tests/asm.h"
|
|
#include "tests/malloc.h"
|
|
#include <string.h>
|
|
|
|
const unsigned int vec0[4]
|
|
= { 0x12345678, 0x11223344, 0x55667788, 0x87654321 };
|
|
|
|
const unsigned int vec1[4]
|
|
= { 0xABCDEF01, 0xAABBCCDD, 0xEEFF0011, 0x10FEDCBA };
|
|
|
|
const unsigned int vecZ[4]
|
|
= { 0, 0, 0, 0 };
|
|
|
|
__attribute__((noinline))
|
|
void do_fxsave ( void* p, int rexw ) {
|
|
if (rexw) {
|
|
#ifdef HAVE_AS_AMD64_FXSAVE64
|
|
asm __volatile__("fxsave64 (%0)" : : "r" (p) : "memory" );
|
|
#else
|
|
asm __volatile__("rex64/fxsave (%0)" : : "r" (p) : "memory" );
|
|
#endif
|
|
} else {
|
|
asm __volatile__("fxsave (%0)" : : "r" (p) : "memory" );
|
|
}
|
|
}
|
|
|
|
__attribute__((noinline))
|
|
void do_fxrstor ( void* p, int rexw ) {
|
|
if (rexw) {
|
|
#ifdef HAVE_AS_AMD64_FXSAVE64
|
|
asm __volatile__("fxrstor64 (%0)" : : "r" (p) : "memory" );
|
|
#else
|
|
asm __volatile__("rex64/fxrstor (%0)" : : "r" (p) : "memory" );
|
|
#endif
|
|
} else {
|
|
asm __volatile__("fxrstor (%0)" : : "r" (p) : "memory" );
|
|
}
|
|
}
|
|
|
|
void do_zeroise ( void )
|
|
{
|
|
asm __volatile__("finit");
|
|
asm __volatile__(
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"fldz\n\t"
|
|
"finit\n");
|
|
#ifndef VGP_amd64_darwin
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm0");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm1");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm2");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm3");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm4");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm5");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm6");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm7");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm8");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm9");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm10");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm11");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm12");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm13");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm14");
|
|
asm __volatile__("movups " VG_SYM(vecZ) ", %xmm15");
|
|
#else
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm0");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm1");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm2");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm3");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm4");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm5");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm6");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm7");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm8");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm9");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm10");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm11");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm12");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm13");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm14");
|
|
asm __volatile__("movups " VG_SYM(vecZ) "(%rip), %xmm15");
|
|
#endif
|
|
asm __volatile__(
|
|
"pushq $0\n\t"
|
|
"ldmxcsr 0(%rsp)\n\t"
|
|
"addq $8,%rsp\n");
|
|
}
|
|
|
|
/* set up the FP and SSE state, and then dump it. */
|
|
void do_setup_then_fxsave ( void* p, int rexw )
|
|
{
|
|
asm __volatile__("finit");
|
|
asm __volatile__("fldpi");
|
|
asm __volatile__("fld1");
|
|
asm __volatile__("fldln2");
|
|
asm __volatile__("fldlg2");
|
|
asm __volatile__("fld %st(3)");
|
|
asm __volatile__("fld %st(3)");
|
|
asm __volatile__("fld1");
|
|
asm __volatile__("movups (%0), %%xmm0" : : "r"(&vec0[0]) : "xmm0" );
|
|
asm __volatile__("movups (%0), %%xmm1" : : "r"(&vec1[0]) : "xmm1" );
|
|
asm __volatile__("xorps %xmm2, %xmm2");
|
|
asm __volatile__("movaps %xmm0, %xmm3");
|
|
asm __volatile__("movaps %xmm1, %xmm4");
|
|
asm __volatile__("movaps %xmm2, %xmm5");
|
|
asm __volatile__("movaps %xmm0, %xmm6");
|
|
asm __volatile__("movaps %xmm1, %xmm7");
|
|
asm __volatile__("movaps %xmm1, %xmm8");
|
|
asm __volatile__("movaps %xmm2, %xmm9");
|
|
asm __volatile__("movaps %xmm0, %xmm10");
|
|
asm __volatile__("movaps %xmm1, %xmm11");
|
|
asm __volatile__("movaps %xmm1, %xmm12");
|
|
asm __volatile__("movaps %xmm2, %xmm13");
|
|
asm __volatile__("movaps %xmm0, %xmm14");
|
|
asm __volatile__("movaps %xmm1, %xmm15");
|
|
do_fxsave(p, rexw);
|
|
}
|
|
|
|
int isFPLsbs ( int i )
|
|
{
|
|
int q;
|
|
q = 32; if (i == q || i == q+1) return 1;
|
|
q = 48; if (i == q || i == q+1) return 1;
|
|
q = 64; if (i == q || i == q+1) return 1;
|
|
q = 80; if (i == q || i == q+1) return 1;
|
|
q = 96; if (i == q || i == q+1) return 1;
|
|
q = 112; if (i == q || i == q+1) return 1;
|
|
q = 128; if (i == q || i == q+1) return 1;
|
|
q = 144; if (i == q || i == q+1) return 1;
|
|
return 0;
|
|
}
|
|
|
|
void show ( unsigned char* buf, int xx )
|
|
{
|
|
int i;
|
|
for (i = 0; i < 512; i++) {
|
|
if ((i % 16) == 0)
|
|
printf("%3d ", i);
|
|
if (xx && isFPLsbs(i))
|
|
printf("xx ");
|
|
else
|
|
printf("%02x ", buf[i]);
|
|
if (i > 0 && ((i % 16) == 15))
|
|
printf("\n");
|
|
}
|
|
}
|
|
|
|
|
|
int main ( int argc, char** argv )
|
|
{
|
|
unsigned char* buf1 = memalign16(512);
|
|
unsigned char* buf2 = memalign16(512);
|
|
unsigned char* buf3 = memalign16(512);
|
|
int xx = argc > 1;
|
|
printf("Re-run with any arg to suppress least-significant\n"
|
|
" 16 bits of FP numbers\n");
|
|
|
|
printf("\n-------- FXSAVE non-64 (REX.W == 0) --------\n");
|
|
|
|
memset(buf1, 0x55, 512);
|
|
memset(buf2, 0x55, 512);
|
|
memset(buf3, 0x55, 512);
|
|
|
|
/* Load up x87/xmm state and dump it. */
|
|
do_setup_then_fxsave(buf1, 0);
|
|
printf("\nBEFORE\n");
|
|
show(buf1, xx);
|
|
|
|
/* Zeroise x87/xmm state and dump it, to show that the
|
|
regs have been cleared out. */
|
|
do_zeroise();
|
|
do_fxsave(buf2, 0);
|
|
printf("\nZEROED\n");
|
|
show(buf2, xx);
|
|
|
|
/* Reload x87/xmm state from buf1 and dump it in buf3. */
|
|
do_fxrstor(buf1, 0);
|
|
do_fxsave(buf3, 0);
|
|
printf("\nRESTORED\n");
|
|
show(buf3, xx);
|
|
|
|
printf("\n-------- FXSAVE 64 (REX.W == 1) --------\n\n");
|
|
|
|
memset(buf1, 0x55, 512);
|
|
memset(buf2, 0x55, 512);
|
|
memset(buf3, 0x55, 512);
|
|
|
|
/* Load up x87/xmm state and dump it. */
|
|
do_setup_then_fxsave(buf1, 1);
|
|
printf("\nBEFORE\n");
|
|
show(buf1, xx);
|
|
|
|
/* Zeroise x87/xmm state and dump it, to show that the
|
|
regs have been cleared out. */
|
|
do_zeroise();
|
|
do_fxsave(buf2, 1);
|
|
printf("\nZEROED\n");
|
|
show(buf2, xx);
|
|
|
|
/* Reload x87/xmm state from buf1 and dump it in buf3. */
|
|
do_fxrstor(buf1, 1);
|
|
do_fxsave(buf3, 1);
|
|
printf("\nRESTORED\n");
|
|
show(buf3, xx);
|
|
|
|
|
|
free(buf1); free(buf2); free(buf3);
|
|
|
|
return 0;
|
|
}
|