comparison run/a/asm_pavgw_01_A.d @ 1285:229e630d4b1a

partuial inline asm review
author thomask
date Tue, 26 Dec 2006 14:21:37 +0000
parents f9084d3862e8
children
comparison
equal deleted inserted replaced
1284:96e7be832c35 1285:229e630d4b1a
14 import addon.cpuinfo; 14 import addon.cpuinfo;
15 15
16 int main(){ 16 int main(){
17 haveSSE!()(); 17 haveSSE!()();
18 18
19 short[] a = new short[8]; 19 short* a = (new short[8]).ptr;
20 a[0] = 1; 20 a[0] = 1;
21 a[1] = -2; 21 a[1] = 2;
22 a[2] = 3; 22 a[2] = 3;
23 a[3] = 4; 23 a[3] = 4;
24 a[4] = 5; 24 a[4] = 5;
25 a[5] = 6; 25 a[5] = 6;
26 a[6] = 7; 26 a[6] = 7;
27 a[7] = 8; 27 a[7] = 8;
28 28
29 short[] b = new short[8]; 29 ushort* b = (new ushort[8]).ptr;
30 b[0] = 5; 30 b[0] = 5;
31 b[1] = 2; 31 b[1] = 2;
32 b[2] = -1; 32 b[2] = 1;
33 b[3] = -8; 33 b[3] = 8;
34 b[4] = 15; 34 b[4] = 15;
35 b[5] = 4; 35 b[5] = 4;
36 b[6] = 1; 36 b[6] = 1;
37 b[7] = 4; 37 b[7] = 4;
38 38
39 short[] c = new short[8]; 39 ushort[] c = new ushort[8];
40 c[0] = 3; 40 c[0] = 3;
41 c[1] = 0; 41 c[1] = 2;
42 c[2] = 1; 42 c[2] = 2;
43 c[3] = -2; 43 c[3] = 6;
44 c[4] = 10; 44 c[4] = 10;
45 c[5] = 5; 45 c[5] = 5;
46 c[6] = 4; 46 c[6] = 4;
47 c[7] = 6; 47 c[7] = 6;
48 48
49 byte[] d = new byte[8]; 49 ushort* d = (new ushort[8]).ptr;
50 50
51 asm{ 51 static if(size_t.sizeof == 4){
52 movdqu XMM0, a; 52 asm{
53 movdqu XMM1, b; 53 mov EAX, a;
54 pavgw XMM0, XMM1; 54 movdqu XMM0, [EAX];
55 movdqu d, XMM0; 55 mov EAX, b;
56 movdqu XMM1, [EAX];
57 pavgw XMM0, XMM1;
58 mov EAX, d;
59 movdqu [EAX], XMM0;
60 }
61 }else static if(size_t.sizeof == 8){
62 asm{
63 mov RAX, a;
64 movdqu XMM0, [RAX];
65 mov RAX, b;
66 movdqu XMM1, [RAX];
67 pavgw XMM0, XMM1;
68 mov RAX, d;
69 movdqu [RAX], XMM0;
70 }
71 }else{
72 static assert(0, "unhandled pointer size");
56 } 73 }
57 74
58 for(size_t i = 0; i < c.length; i++){ 75 for(size_t i = 0; i < c.length; i++){
59 if(d[i] != c[i]){ 76 if(d[i] != c[i]){
60 assert(0); 77 assert(0);