1 // Copyright 2016 The SwiftShader Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //    http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #include "Nucleus.hpp"
16 
17 namespace sw
18 {
19 	namespace x86
20 	{
21 		RValue<Int> cvtss2si(RValue<Float> val);
22 		RValue<Int2> cvtps2pi(RValue<Float4> val);
23 		RValue<Int2> cvttps2pi(RValue<Float4> val);
24 		RValue<Int4> cvtps2dq(RValue<Float4> val);
25 
26 		RValue<Float> rcpss(RValue<Float> val);
27 		RValue<Float> sqrtss(RValue<Float> val);
28 		RValue<Float> rsqrtss(RValue<Float> val);
29 
30 		RValue<Float4> rcpps(RValue<Float4> val);
31 		RValue<Float4> sqrtps(RValue<Float4> val);
32 		RValue<Float4> rsqrtps(RValue<Float4> val);
33 		RValue<Float4> maxps(RValue<Float4> x, RValue<Float4> y);
34 		RValue<Float4> minps(RValue<Float4> x, RValue<Float4> y);
35 
36 		RValue<Float> roundss(RValue<Float> val, unsigned char imm);
37 		RValue<Float> floorss(RValue<Float> val);
38 		RValue<Float> ceilss(RValue<Float> val);
39 
40 		RValue<Float4> roundps(RValue<Float4> val, unsigned char imm);
41 		RValue<Float4> floorps(RValue<Float4> val);
42 		RValue<Float4> ceilps(RValue<Float4> val);
43 
44 		RValue<Float4> cmpps(RValue<Float4> x, RValue<Float4> y, unsigned char imm);
45 		RValue<Float4> cmpeqps(RValue<Float4> x, RValue<Float4> y);
46 		RValue<Float4> cmpltps(RValue<Float4> x, RValue<Float4> y);
47 		RValue<Float4> cmpleps(RValue<Float4> x, RValue<Float4> y);
48 		RValue<Float4> cmpunordps(RValue<Float4> x, RValue<Float4> y);
49 		RValue<Float4> cmpneqps(RValue<Float4> x, RValue<Float4> y);
50 		RValue<Float4> cmpnltps(RValue<Float4> x, RValue<Float4> y);
51 		RValue<Float4> cmpnleps(RValue<Float4> x, RValue<Float4> y);
52 		RValue<Float4> cmpordps(RValue<Float4> x, RValue<Float4> y);
53 
54 		RValue<Float> cmpss(RValue<Float> x, RValue<Float> y, unsigned char imm);
55 		RValue<Float> cmpeqss(RValue<Float> x, RValue<Float> y);
56 		RValue<Float> cmpltss(RValue<Float> x, RValue<Float> y);
57 		RValue<Float> cmpless(RValue<Float> x, RValue<Float> y);
58 		RValue<Float> cmpunordss(RValue<Float> x, RValue<Float> y);
59 		RValue<Float> cmpneqss(RValue<Float> x, RValue<Float> y);
60 		RValue<Float> cmpnltss(RValue<Float> x, RValue<Float> y);
61 		RValue<Float> cmpnless(RValue<Float> x, RValue<Float> y);
62 		RValue<Float> cmpordss(RValue<Float> x, RValue<Float> y);
63 
64 		RValue<Int4> pabsd(RValue<Int4> x);
65 
66 		RValue<Short4> paddsw(RValue<Short4> x, RValue<Short4> y);
67 		RValue<Short4> psubsw(RValue<Short4> x, RValue<Short4> y);
68 		RValue<UShort4> paddusw(RValue<UShort4> x, RValue<UShort4> y);
69 		RValue<UShort4> psubusw(RValue<UShort4> x, RValue<UShort4> y);
70 		RValue<SByte8> paddsb(RValue<SByte8> x, RValue<SByte8> y);
71 		RValue<SByte8> psubsb(RValue<SByte8> x, RValue<SByte8> y);
72 		RValue<Byte8> paddusb(RValue<Byte8> x, RValue<Byte8> y);
73 		RValue<Byte8> psubusb(RValue<Byte8> x, RValue<Byte8> y);
74 
75 		RValue<Short4> paddw(RValue<Short4> x, RValue<Short4> y);
76 		RValue<Short4> psubw(RValue<Short4> x, RValue<Short4> y);
77 		RValue<Short4> pmullw(RValue<Short4> x, RValue<Short4> y);
78 		RValue<Short4> pand(RValue<Short4> x, RValue<Short4> y);
79 		RValue<Short4> por(RValue<Short4> x, RValue<Short4> y);
80 		RValue<Short4> pxor(RValue<Short4> x, RValue<Short4> y);
81 		RValue<Short4> pshufw(RValue<Short4> x, unsigned char y);
82 		RValue<Int2> punpcklwd(RValue<Short4> x, RValue<Short4> y);
83 		RValue<Int2> punpckhwd(RValue<Short4> x, RValue<Short4> y);
84 		RValue<Short4> pinsrw(RValue<Short4> x, RValue<Int> y, unsigned int i);
85 		RValue<Int> pextrw(RValue<Short4> x, unsigned int i);
86 		RValue<Long1> punpckldq(RValue<Int2> x, RValue<Int2> y);
87 		RValue<Long1> punpckhdq(RValue<Int2> x, RValue<Int2> y);
88 		RValue<Short4> punpcklbw(RValue<Byte8> x, RValue<Byte8> y);
89 		RValue<Short4> punpckhbw(RValue<Byte8> x, RValue<Byte8> y);
90 		RValue<Byte8> paddb(RValue<Byte8> x, RValue<Byte8> y);
91 		RValue<Byte8> psubb(RValue<Byte8> x, RValue<Byte8> y);
92 		RValue<Int2> paddd(RValue<Int2> x, RValue<Int2> y);
93 		RValue<Int2> psubd(RValue<Int2> x, RValue<Int2> y);
94 
95 		RValue<UShort4> pavgw(RValue<UShort4> x, RValue<UShort4> y);
96 
97 		RValue<Short4> pmaxsw(RValue<Short4> x, RValue<Short4> y);
98 		RValue<Short4> pminsw(RValue<Short4> x, RValue<Short4> y);
99 
100 		RValue<Short4> pcmpgtw(RValue<Short4> x, RValue<Short4> y);
101 		RValue<Short4> pcmpeqw(RValue<Short4> x, RValue<Short4> y);
102 		RValue<Byte8> pcmpgtb(RValue<SByte8> x, RValue<SByte8> y);
103 		RValue<Byte8> pcmpeqb(RValue<Byte8> x, RValue<Byte8> y);
104 
105 		RValue<Short4> packssdw(RValue<Int2> x, RValue<Int2> y);
106 		RValue<Short8> packssdw(RValue<Int4> x, RValue<Int4> y);
107 		RValue<SByte8> packsswb(RValue<Short4> x, RValue<Short4> y);
108 		RValue<Byte8> packuswb(RValue<UShort4> x, RValue<UShort4> y);
109 
110 		RValue<UShort8> packusdw(RValue<UInt4> x, RValue<UInt4> y);
111 
112 		RValue<UShort4> psrlw(RValue<UShort4> x, unsigned char y);
113 		RValue<UShort8> psrlw(RValue<UShort8> x, unsigned char y);
114 		RValue<Short4> psraw(RValue<Short4> x, unsigned char y);
115 		RValue<Short8> psraw(RValue<Short8> x, unsigned char y);
116 		RValue<Short4> psllw(RValue<Short4> x, unsigned char y);
117 		RValue<Short8> psllw(RValue<Short8> x, unsigned char y);
118 		RValue<Int2> pslld(RValue<Int2> x, unsigned char y);
119 		RValue<Int4> pslld(RValue<Int4> x, unsigned char y);
120 		RValue<Int2> psrad(RValue<Int2> x, unsigned char y);
121 		RValue<Int4> psrad(RValue<Int4> x, unsigned char y);
122 		RValue<UInt2> psrld(RValue<UInt2> x, unsigned char y);
123 		RValue<UInt4> psrld(RValue<UInt4> x, unsigned char y);
124 
125 		RValue<UShort4> psrlw(RValue<UShort4> x, RValue<Long1> y);
126 		RValue<Short4> psraw(RValue<Short4> x, RValue<Long1> y);
127 		RValue<Short4> psllw(RValue<Short4> x, RValue<Long1> y);
128 		RValue<Int2> pslld(RValue<Int2> x, RValue<Long1> y);
129 		RValue<UInt2> psrld(RValue<UInt2> x, RValue<Long1> y);
130 		RValue<Int2> psrad(RValue<Int2> x, RValue<Long1> y);
131 
132 		RValue<Int4> pmaxsd(RValue<Int4> x, RValue<Int4> y);
133 		RValue<Int4> pminsd(RValue<Int4> x, RValue<Int4> y);
134 		RValue<UInt4> pmaxud(RValue<UInt4> x, RValue<UInt4> y);
135 		RValue<UInt4> pminud(RValue<UInt4> x, RValue<UInt4> y);
136 
137 		RValue<Short4> pmulhw(RValue<Short4> x, RValue<Short4> y);
138 		RValue<UShort4> pmulhuw(RValue<UShort4> x, RValue<UShort4> y);
139 		RValue<Int2> pmaddwd(RValue<Short4> x, RValue<Short4> y);
140 
141 		RValue<Short8> pmulhw(RValue<Short8> x, RValue<Short8> y);
142 		RValue<UShort8> pmulhuw(RValue<UShort8> x, RValue<UShort8> y);
143 		RValue<Int4> pmaddwd(RValue<Short8> x, RValue<Short8> y);
144 
145 		RValue<Int> movmskps(RValue<Float4> x);
146 		RValue<Int> pmovmskb(RValue<Byte8> x);
147 
148 		RValue<Int4> pmovzxbd(RValue<Int4> x);
149 		RValue<Int4> pmovsxbd(RValue<Int4> x);
150 		RValue<Int4> pmovzxwd(RValue<Int4> x);
151 		RValue<Int4> pmovsxwd(RValue<Int4> x);
152 
153 		void emms();
154 	}
155 }
156