1 // Copyright 2016 The SwiftShader Authors. All Rights Reserved. 2 // 3 // Licensed under the Apache License, Version 2.0 (the "License"); 4 // you may not use this file except in compliance with the License. 5 // You may obtain a copy of the License at 6 // 7 // http://www.apache.org/licenses/LICENSE-2.0 8 // 9 // Unless required by applicable law or agreed to in writing, software 10 // distributed under the License is distributed on an "AS IS" BASIS, 11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 // See the License for the specific language governing permissions and 13 // limitations under the License. 14 15 #include "Nucleus.hpp" 16 17 namespace sw 18 { 19 namespace x86 20 { 21 RValue<Int> cvtss2si(RValue<Float> val); 22 RValue<Int2> cvtps2pi(RValue<Float4> val); 23 RValue<Int2> cvttps2pi(RValue<Float4> val); 24 RValue<Int4> cvtps2dq(RValue<Float4> val); 25 26 RValue<Float> rcpss(RValue<Float> val); 27 RValue<Float> sqrtss(RValue<Float> val); 28 RValue<Float> rsqrtss(RValue<Float> val); 29 30 RValue<Float4> rcpps(RValue<Float4> val); 31 RValue<Float4> sqrtps(RValue<Float4> val); 32 RValue<Float4> rsqrtps(RValue<Float4> val); 33 RValue<Float4> maxps(RValue<Float4> x, RValue<Float4> y); 34 RValue<Float4> minps(RValue<Float4> x, RValue<Float4> y); 35 36 RValue<Float> roundss(RValue<Float> val, unsigned char imm); 37 RValue<Float> floorss(RValue<Float> val); 38 RValue<Float> ceilss(RValue<Float> val); 39 40 RValue<Float4> roundps(RValue<Float4> val, unsigned char imm); 41 RValue<Float4> floorps(RValue<Float4> val); 42 RValue<Float4> ceilps(RValue<Float4> val); 43 44 RValue<Float4> cmpps(RValue<Float4> x, RValue<Float4> y, unsigned char imm); 45 RValue<Float4> cmpeqps(RValue<Float4> x, RValue<Float4> y); 46 RValue<Float4> cmpltps(RValue<Float4> x, RValue<Float4> y); 47 RValue<Float4> cmpleps(RValue<Float4> x, RValue<Float4> y); 48 RValue<Float4> cmpunordps(RValue<Float4> x, RValue<Float4> y); 49 RValue<Float4> cmpneqps(RValue<Float4> x, RValue<Float4> y); 50 RValue<Float4> cmpnltps(RValue<Float4> x, RValue<Float4> y); 51 RValue<Float4> cmpnleps(RValue<Float4> x, RValue<Float4> y); 52 RValue<Float4> cmpordps(RValue<Float4> x, RValue<Float4> y); 53 54 RValue<Float> cmpss(RValue<Float> x, RValue<Float> y, unsigned char imm); 55 RValue<Float> cmpeqss(RValue<Float> x, RValue<Float> y); 56 RValue<Float> cmpltss(RValue<Float> x, RValue<Float> y); 57 RValue<Float> cmpless(RValue<Float> x, RValue<Float> y); 58 RValue<Float> cmpunordss(RValue<Float> x, RValue<Float> y); 59 RValue<Float> cmpneqss(RValue<Float> x, RValue<Float> y); 60 RValue<Float> cmpnltss(RValue<Float> x, RValue<Float> y); 61 RValue<Float> cmpnless(RValue<Float> x, RValue<Float> y); 62 RValue<Float> cmpordss(RValue<Float> x, RValue<Float> y); 63 64 RValue<Int4> pabsd(RValue<Int4> x); 65 66 RValue<Short4> paddsw(RValue<Short4> x, RValue<Short4> y); 67 RValue<Short4> psubsw(RValue<Short4> x, RValue<Short4> y); 68 RValue<UShort4> paddusw(RValue<UShort4> x, RValue<UShort4> y); 69 RValue<UShort4> psubusw(RValue<UShort4> x, RValue<UShort4> y); 70 RValue<SByte8> paddsb(RValue<SByte8> x, RValue<SByte8> y); 71 RValue<SByte8> psubsb(RValue<SByte8> x, RValue<SByte8> y); 72 RValue<Byte8> paddusb(RValue<Byte8> x, RValue<Byte8> y); 73 RValue<Byte8> psubusb(RValue<Byte8> x, RValue<Byte8> y); 74 75 RValue<Short4> paddw(RValue<Short4> x, RValue<Short4> y); 76 RValue<Short4> psubw(RValue<Short4> x, RValue<Short4> y); 77 RValue<Short4> pmullw(RValue<Short4> x, RValue<Short4> y); 78 RValue<Short4> pand(RValue<Short4> x, RValue<Short4> y); 79 RValue<Short4> por(RValue<Short4> x, RValue<Short4> y); 80 RValue<Short4> pxor(RValue<Short4> x, RValue<Short4> y); 81 RValue<Short4> pshufw(RValue<Short4> x, unsigned char y); 82 RValue<Int2> punpcklwd(RValue<Short4> x, RValue<Short4> y); 83 RValue<Int2> punpckhwd(RValue<Short4> x, RValue<Short4> y); 84 RValue<Short4> pinsrw(RValue<Short4> x, RValue<Int> y, unsigned int i); 85 RValue<Int> pextrw(RValue<Short4> x, unsigned int i); 86 RValue<Long1> punpckldq(RValue<Int2> x, RValue<Int2> y); 87 RValue<Long1> punpckhdq(RValue<Int2> x, RValue<Int2> y); 88 RValue<Short4> punpcklbw(RValue<Byte8> x, RValue<Byte8> y); 89 RValue<Short4> punpckhbw(RValue<Byte8> x, RValue<Byte8> y); 90 RValue<Byte8> paddb(RValue<Byte8> x, RValue<Byte8> y); 91 RValue<Byte8> psubb(RValue<Byte8> x, RValue<Byte8> y); 92 RValue<Int2> paddd(RValue<Int2> x, RValue<Int2> y); 93 RValue<Int2> psubd(RValue<Int2> x, RValue<Int2> y); 94 95 RValue<UShort4> pavgw(RValue<UShort4> x, RValue<UShort4> y); 96 97 RValue<Short4> pmaxsw(RValue<Short4> x, RValue<Short4> y); 98 RValue<Short4> pminsw(RValue<Short4> x, RValue<Short4> y); 99 100 RValue<Short4> pcmpgtw(RValue<Short4> x, RValue<Short4> y); 101 RValue<Short4> pcmpeqw(RValue<Short4> x, RValue<Short4> y); 102 RValue<Byte8> pcmpgtb(RValue<SByte8> x, RValue<SByte8> y); 103 RValue<Byte8> pcmpeqb(RValue<Byte8> x, RValue<Byte8> y); 104 105 RValue<Short4> packssdw(RValue<Int2> x, RValue<Int2> y); 106 RValue<Short8> packssdw(RValue<Int4> x, RValue<Int4> y); 107 RValue<SByte8> packsswb(RValue<Short4> x, RValue<Short4> y); 108 RValue<Byte8> packuswb(RValue<UShort4> x, RValue<UShort4> y); 109 110 RValue<UShort8> packusdw(RValue<UInt4> x, RValue<UInt4> y); 111 112 RValue<UShort4> psrlw(RValue<UShort4> x, unsigned char y); 113 RValue<UShort8> psrlw(RValue<UShort8> x, unsigned char y); 114 RValue<Short4> psraw(RValue<Short4> x, unsigned char y); 115 RValue<Short8> psraw(RValue<Short8> x, unsigned char y); 116 RValue<Short4> psllw(RValue<Short4> x, unsigned char y); 117 RValue<Short8> psllw(RValue<Short8> x, unsigned char y); 118 RValue<Int2> pslld(RValue<Int2> x, unsigned char y); 119 RValue<Int4> pslld(RValue<Int4> x, unsigned char y); 120 RValue<Int2> psrad(RValue<Int2> x, unsigned char y); 121 RValue<Int4> psrad(RValue<Int4> x, unsigned char y); 122 RValue<UInt2> psrld(RValue<UInt2> x, unsigned char y); 123 RValue<UInt4> psrld(RValue<UInt4> x, unsigned char y); 124 125 RValue<UShort4> psrlw(RValue<UShort4> x, RValue<Long1> y); 126 RValue<Short4> psraw(RValue<Short4> x, RValue<Long1> y); 127 RValue<Short4> psllw(RValue<Short4> x, RValue<Long1> y); 128 RValue<Int2> pslld(RValue<Int2> x, RValue<Long1> y); 129 RValue<UInt2> psrld(RValue<UInt2> x, RValue<Long1> y); 130 RValue<Int2> psrad(RValue<Int2> x, RValue<Long1> y); 131 132 RValue<Int4> pmaxsd(RValue<Int4> x, RValue<Int4> y); 133 RValue<Int4> pminsd(RValue<Int4> x, RValue<Int4> y); 134 RValue<UInt4> pmaxud(RValue<UInt4> x, RValue<UInt4> y); 135 RValue<UInt4> pminud(RValue<UInt4> x, RValue<UInt4> y); 136 137 RValue<Short4> pmulhw(RValue<Short4> x, RValue<Short4> y); 138 RValue<UShort4> pmulhuw(RValue<UShort4> x, RValue<UShort4> y); 139 RValue<Int2> pmaddwd(RValue<Short4> x, RValue<Short4> y); 140 141 RValue<Short8> pmulhw(RValue<Short8> x, RValue<Short8> y); 142 RValue<UShort8> pmulhuw(RValue<UShort8> x, RValue<UShort8> y); 143 RValue<Int4> pmaddwd(RValue<Short8> x, RValue<Short8> y); 144 145 RValue<Int> movmskps(RValue<Float4> x); 146 RValue<Int> pmovmskb(RValue<Byte8> x); 147 148 RValue<Int4> pmovzxbd(RValue<Int4> x); 149 RValue<Int4> pmovsxbd(RValue<Int4> x); 150 RValue<Int4> pmovzxwd(RValue<Int4> x); 151 RValue<Int4> pmovsxwd(RValue<Int4> x); 152 153 void emms(); 154 } 155 } 156