// $HeadURL$
// $Date$
// $Author$

module dstress.run.a.asm_addss_01_A;

// Define the `runTest` version identifier when the compiler advertises
// x86 inline assembler support, in either its 32-bit (D_InlineAsm_X86)
// or 64-bit (D_InlineAsm_X86_64) form. When neither is predefined,
// `runTest` stays unset.
version(D_InlineAsm_X86)
	version = runTest;
else version(D_InlineAsm_X86_64)
	version = runTest;

// Run-time test for the ADDSS instruction issued through inline assembler.
//
// Two 4-float vectors are loaded into XMM0 and XMM1, ADDSS XMM0, XMM1 is
// executed and XMM0 is stored back over the second vector. The checks then
// expect lane 0 to hold the sum of both lane-0 inputs (1 + 4 = 5) and
// lanes 1..3 to still hold the first vector's values (20, 0.4, 2).
//
// Without the `runTest` version the file deliberately fails to compile and
// emits the DSTRESS XFAIL marker instead.
version(runTest){
	import addon.cpuinfo;

	int main(){
		// Helper from addon.cpuinfo.
		// NOTE(review): presumably verifies SSE availability before the
		// asm below runs - confirm against addon.cpuinfo.
		haveSSE!()();

		// Largest absolute deviation accepted for each lane.
		const float tolerance = float.epsilon * 16;

		// First operand; ends up in XMM0.
		float* lhs = (new float[4]).ptr;
		lhs[0] = 1.0f;
		lhs[1] = 20.0f;
		lhs[2] = 0.4f;
		lhs[3] = 2.0f;

		// Second operand; ends up in XMM1 and is overwritten with the result.
		float* rhs = (new float[4]).ptr;
		rhs[0] = 4.0f;
		rhs[1] = 10.0f;
		rhs[2] = -4.0f;
		rhs[3] = -0.4f;

		// Use the general purpose register that matches the pointer width.
		static if(size_t.sizeof == 8){
			asm{
				mov RAX, lhs;
				movups XMM0, [RAX];
				mov RAX, rhs;
				movups XMM1, [RAX];
				addss XMM0, XMM1;
				// RAX still addresses rhs: the result replaces its contents.
				movups [RAX], XMM0;
			}
		}else static if(size_t.sizeof == 4){
			asm{
				mov EAX, lhs;
				movups XMM0, [EAX];
				mov EAX, rhs;
				movups XMM1, [EAX];
				addss XMM0, XMM1;
				// EAX still addresses rhs: the result replaces its contents.
				movups [EAX], XMM0;
			}
		}else{
			static assert(0, "unhandled pointer size");
		}

		// Each lane: subtract the expected value, take the absolute value
		// and fail when the remaining error exceeds the tolerance.

		// lane 0: 1.0 + 4.0
		rhs[0] -= 5.0f;
		if(rhs[0] < 0.0) rhs[0] = -rhs[0];
		if(rhs[0] > tolerance) assert(0);

		// lane 1: expected to equal lhs[1]
		rhs[1] -= 20.0f;
		if(rhs[1] < 0.0) rhs[1] = -rhs[1];
		if(rhs[1] > tolerance) assert(0);

		// lane 2: expected to equal lhs[2]
		rhs[2] -= 0.4f;
		if(rhs[2] < 0.0) rhs[2] = -rhs[2];
		if(rhs[2] > tolerance) assert(0);

		// lane 3: expected to equal lhs[3]
		rhs[3] -= 2.0f;
		if(rhs[3] < 0.0) rhs[3] = -rhs[3];
		if(rhs[3] > tolerance) assert(0);

		return 0;
	}
}else{
	// No inline assembler available: report an expected failure to the
	// DStress harness and stop compilation.
	pragma(msg, "DSTRESS{XFAIL}: no inline ASM support");
	static assert(0);
}