1 // Copyright 2011 the V8 project authors. All rights reserved.
2 // Redistribution and use in source and binary forms, with or without
3 // modification, are permitted provided that the following conditions are
4 // met:
5 //
6 //     * Redistributions of source code must retain the above copyright
7 //       notice, this list of conditions and the following disclaimer.
8 //     * Redistributions in binary form must reproduce the above
9 //       copyright notice, this list of conditions and the following
10 //       disclaimer in the documentation and/or other materials provided
11 //       with the distribution.
12 //     * Neither the name of Google Inc. nor the names of its
13 //       contributors may be used to endorse or promote products derived
14 //       from this software without specific prior written permission.
15 //
16 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 
28 #include <stdlib.h>
29 
30 #include "src/v8.h"
31 
32 #include "src/debug/debug.h"
33 #include "src/disasm.h"
34 #include "src/disassembler.h"
35 #include "src/ic/ic.h"
36 #include "src/macro-assembler.h"
37 #include "test/cctest/cctest.h"
38 
39 using namespace v8::internal;
40 
41 
42 #define __ assm.
43 
44 
DummyStaticFunction(Object * result)45 static void DummyStaticFunction(Object* result) {
46 }
47 
48 
TEST(DisasmX64)49 TEST(DisasmX64) {
50   CcTest::InitializeVM();
51   Isolate* isolate = CcTest::i_isolate();
52   HandleScope scope(isolate);
53   v8::internal::byte buffer[4096];
54   Assembler assm(isolate, buffer, sizeof buffer);
55   DummyStaticFunction(NULL);  // just bloody use it (DELETE; debugging)
56 
57   // Short immediate instructions
58   __ addq(rax, Immediate(12345678));
59   __ orq(rax, Immediate(12345678));
60   __ subq(rax, Immediate(12345678));
61   __ xorq(rax, Immediate(12345678));
62   __ andq(rax, Immediate(12345678));
63 
64   // ---- This one caused crash
65   __ movq(rbx,  Operand(rsp, rcx, times_2, 0));  // [rsp+rcx*4]
66 
67   // ---- All instructions that I can think of
68   __ addq(rdx, rbx);
69   __ addq(rdx, Operand(rbx, 0));
70   __ addq(rdx, Operand(rbx, 16));
71   __ addq(rdx, Operand(rbx, 1999));
72   __ addq(rdx, Operand(rbx, -4));
73   __ addq(rdx, Operand(rbx, -1999));
74   __ addq(rdx, Operand(rsp, 0));
75   __ addq(rdx, Operand(rsp, 16));
76   __ addq(rdx, Operand(rsp, 1999));
77   __ addq(rdx, Operand(rsp, -4));
78   __ addq(rdx, Operand(rsp, -1999));
79   __ nop();
80   __ addq(rsi, Operand(rcx, times_4, 0));
81   __ addq(rsi, Operand(rcx, times_4, 24));
82   __ addq(rsi, Operand(rcx, times_4, -4));
83   __ addq(rsi, Operand(rcx, times_4, -1999));
84   __ nop();
85   __ addq(rdi, Operand(rbp, rcx, times_4, 0));
86   __ addq(rdi, Operand(rbp, rcx, times_4, 12));
87   __ addq(rdi, Operand(rbp, rcx, times_4, -8));
88   __ addq(rdi, Operand(rbp, rcx, times_4, -3999));
89   __ addq(Operand(rbp, rcx, times_4, 12), Immediate(12));
90 
91   __ bsrl(rax, r15);
92   __ bsrl(r9, Operand(rcx, times_8, 91919));
93 
94   __ nop();
95   __ addq(rbx, Immediate(12));
96   __ nop();
97   __ nop();
98   __ andq(rdx, Immediate(3));
99   __ andq(rdx, Operand(rsp, 4));
100   __ cmpq(rdx, Immediate(3));
101   __ cmpq(rdx, Operand(rsp, 4));
102   __ cmpq(Operand(rbp, rcx, times_4, 0), Immediate(1000));
103   __ cmpb(rbx, Operand(rbp, rcx, times_2, 0));
104   __ cmpb(Operand(rbp, rcx, times_2, 0), rbx);
105   __ orq(rdx, Immediate(3));
106   __ xorq(rdx, Immediate(3));
107   __ nop();
108   __ cpuid();
109   __ movsxbl(rdx, Operand(rcx, 0));
110   __ movsxbq(rdx, Operand(rcx, 0));
111   __ movsxwl(rdx, Operand(rcx, 0));
112   __ movsxwq(rdx, Operand(rcx, 0));
113   __ movzxbl(rdx, Operand(rcx, 0));
114   __ movzxwl(rdx, Operand(rcx, 0));
115   __ movzxbq(rdx, Operand(rcx, 0));
116   __ movzxwq(rdx, Operand(rcx, 0));
117 
118   __ nop();
119   __ imulq(rdx, rcx);
120   __ shld(rdx, rcx);
121   __ shrd(rdx, rcx);
122   __ shlq(Operand(rdi, rax, times_4, 100), Immediate(1));
123   __ shlq(Operand(rdi, rax, times_4, 100), Immediate(6));
124   __ shlq(Operand(r15, 0), Immediate(1));
125   __ shlq(Operand(r15, 0), Immediate(6));
126   __ shlq_cl(Operand(r15, 0));
127   __ shlq_cl(Operand(r15, 0));
128   __ shlq_cl(Operand(rdi, rax, times_4, 100));
129   __ shlq_cl(Operand(rdi, rax, times_4, 100));
130   __ shlq(rdx, Immediate(1));
131   __ shlq(rdx, Immediate(6));
132   __ shll(Operand(rdi, rax, times_4, 100), Immediate(1));
133   __ shll(Operand(rdi, rax, times_4, 100), Immediate(6));
134   __ shll(Operand(r15, 0), Immediate(1));
135   __ shll(Operand(r15, 0), Immediate(6));
136   __ shll_cl(Operand(r15, 0));
137   __ shll_cl(Operand(r15, 0));
138   __ shll_cl(Operand(rdi, rax, times_4, 100));
139   __ shll_cl(Operand(rdi, rax, times_4, 100));
140   __ shll(rdx, Immediate(1));
141   __ shll(rdx, Immediate(6));
142   __ bts(Operand(rdx, 0), rcx);
143   __ bts(Operand(rbx, rcx, times_4, 0), rcx);
144   __ nop();
145   __ pushq(Immediate(12));
146   __ pushq(Immediate(23456));
147   __ pushq(rcx);
148   __ pushq(rsi);
149   __ pushq(Operand(rbp, JavaScriptFrameConstants::kFunctionOffset));
150   __ pushq(Operand(rbx, rcx, times_4, 0));
151   __ pushq(Operand(rbx, rcx, times_4, 0));
152   __ pushq(Operand(rbx, rcx, times_4, 10000));
153   __ popq(rdx);
154   __ popq(rax);
155   __ popq(Operand(rbx, rcx, times_4, 0));
156   __ nop();
157 
158   __ addq(rdx, Operand(rsp, 16));
159   __ addq(rdx, rcx);
160   __ movb(rdx, Operand(rcx, 0));
161   __ movb(rcx, Immediate(6));
162   __ movb(Operand(rsp, 16), rdx);
163   __ movw(Operand(rsp, 16), rdx);
164   __ nop();
165   __ movsxwq(rdx, Operand(rsp, 12));
166   __ movsxbq(rdx, Operand(rsp, 12));
167   __ movsxlq(rdx, Operand(rsp, 12));
168   __ movzxwq(rdx, Operand(rsp, 12));
169   __ movzxbq(rdx, Operand(rsp, 12));
170   __ nop();
171   __ movq(rdx, Immediate(1234567));
172   __ movq(rdx, Operand(rsp, 12));
173   __ movq(Operand(rbx, rcx, times_4, 10000), Immediate(12345));
174   __ movq(Operand(rbx, rcx, times_4, 10000), rdx);
175   __ nop();
176   __ decb(rdx);
177   __ decb(Operand(rax, 10));
178   __ decb(Operand(rbx, rcx, times_4, 10000));
179   __ decq(rdx);
180   __ cdq();
181 
182   __ nop();
183   __ idivq(rdx);
184   __ mull(rdx);
185   __ mulq(rdx);
186   __ negq(rdx);
187   __ notq(rdx);
188   __ testq(Operand(rbx, rcx, times_4, 10000), rdx);
189 
190   __ imulq(rdx, rcx, Immediate(12));
191   __ imulq(rdx, rcx, Immediate(1000));
192   __ imulq(rdx, Operand(rbx, rcx, times_4, 10000));
193   __ imulq(rdx, Operand(rbx, rcx, times_4, 10000), Immediate(12));
194   __ imulq(rdx, Operand(rbx, rcx, times_4, 10000), Immediate(1000));
195   __ imull(r15, rcx, Immediate(12));
196   __ imull(r15, rcx, Immediate(1000));
197   __ imull(r15, Operand(rbx, rcx, times_4, 10000));
198   __ imull(r15, Operand(rbx, rcx, times_4, 10000), Immediate(12));
199   __ imull(r15, Operand(rbx, rcx, times_4, 10000), Immediate(1000));
200 
201   __ incq(rdx);
202   __ incq(Operand(rbx, rcx, times_4, 10000));
203   __ pushq(Operand(rbx, rcx, times_4, 10000));
204   __ popq(Operand(rbx, rcx, times_4, 10000));
205   // TODO(mstarzinger): The following is protected.
206   // __ jmp(Operand(rbx, rcx, times_4, 10000));
207 
208   __ leaq(rdx, Operand(rbx, rcx, times_4, 10000));
209   __ orq(rdx, Immediate(12345));
210   __ orq(rdx, Operand(rbx, rcx, times_4, 10000));
211 
212   __ nop();
213 
214   __ rclq(rdx, Immediate(1));
215   __ rclq(rdx, Immediate(7));
216   __ rcrq(rdx, Immediate(1));
217   __ rcrq(rdx, Immediate(7));
218   __ sarq(rdx, Immediate(1));
219   __ sarq(rdx, Immediate(6));
220   __ sarq_cl(rdx);
221   __ sbbq(rdx, rbx);
222   __ shld(rdx, rbx);
223   __ shlq(rdx, Immediate(1));
224   __ shlq(rdx, Immediate(6));
225   __ shlq_cl(rdx);
226   __ shrd(rdx, rbx);
227   __ shrq(rdx, Immediate(1));
228   __ shrq(rdx, Immediate(7));
229   __ shrq_cl(rdx);
230 
231 
232   // Immediates
233 
234   __ addq(rbx, Immediate(12));
235   __ addq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
236 
237   __ andq(rbx, Immediate(12345));
238 
239   __ cmpq(rbx, Immediate(12345));
240   __ cmpq(rbx, Immediate(12));
241   __ cmpq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
242   __ cmpb(rax, Immediate(100));
243 
244   __ orq(rbx, Immediate(12345));
245 
246   __ subq(rbx, Immediate(12));
247   __ subq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
248 
249   __ xorq(rbx, Immediate(12345));
250 
251   __ imulq(rdx, rcx, Immediate(12));
252   __ imulq(rdx, rcx, Immediate(1000));
253 
254   __ cld();
255 
256   __ subq(rdx, Operand(rbx, rcx, times_4, 10000));
257   __ subq(rdx, rbx);
258 
259   __ testq(rdx, Immediate(12345));
260   __ testq(Operand(rbx, rcx, times_8, 10000), rdx);
261   __ testb(Operand(rcx, rbx, times_2, 1000), rdx);
262   __ testb(Operand(rax, -20), Immediate(0x9A));
263   __ nop();
264 
265   __ xorq(rdx, Immediate(12345));
266   __ xorq(rdx, Operand(rbx, rcx, times_8, 10000));
267   __ bts(Operand(rbx, rcx, times_8, 10000), rdx);
268   __ hlt();
269   __ int3();
270   __ ret(0);
271   __ ret(8);
272 
273   // Calls
274 
275   Label L1, L2;
276   __ bind(&L1);
277   __ nop();
278   __ call(&L1);
279   __ call(&L2);
280   __ nop();
281   __ bind(&L2);
282   // TODO(mstarzinger): The following is protected.
283   // __ call(Operand(rbx, rcx, times_4, 10000));
284   __ nop();
285   Handle<Code> ic(LoadIC::initialize_stub(isolate, NOT_INSIDE_TYPEOF));
286   __ call(ic, RelocInfo::CODE_TARGET);
287   __ nop();
288   __ nop();
289 
290   __ jmp(&L1);
291   // TODO(mstarzinger): The following is protected.
292   // __ jmp(Operand(rbx, rcx, times_4, 10000));
293   ExternalReference after_break_target =
294       ExternalReference::debug_after_break_target_address(isolate);
295   USE(after_break_target);
296   __ jmp(ic, RelocInfo::CODE_TARGET);
297   __ nop();
298 
299 
300   Label Ljcc;
301   __ nop();
302   // long jumps
303   __ j(overflow, &Ljcc);
304   __ j(no_overflow, &Ljcc);
305   __ j(below, &Ljcc);
306   __ j(above_equal, &Ljcc);
307   __ j(equal, &Ljcc);
308   __ j(not_equal, &Ljcc);
309   __ j(below_equal, &Ljcc);
310   __ j(above, &Ljcc);
311   __ j(sign, &Ljcc);
312   __ j(not_sign, &Ljcc);
313   __ j(parity_even, &Ljcc);
314   __ j(parity_odd, &Ljcc);
315   __ j(less, &Ljcc);
316   __ j(greater_equal, &Ljcc);
317   __ j(less_equal, &Ljcc);
318   __ j(greater, &Ljcc);
319   __ nop();
320   __ bind(&Ljcc);
321   // short jumps
322   __ j(overflow, &Ljcc);
323   __ j(no_overflow, &Ljcc);
324   __ j(below, &Ljcc);
325   __ j(above_equal, &Ljcc);
326   __ j(equal, &Ljcc);
327   __ j(not_equal, &Ljcc);
328   __ j(below_equal, &Ljcc);
329   __ j(above, &Ljcc);
330   __ j(sign, &Ljcc);
331   __ j(not_sign, &Ljcc);
332   __ j(parity_even, &Ljcc);
333   __ j(parity_odd, &Ljcc);
334   __ j(less, &Ljcc);
335   __ j(greater_equal, &Ljcc);
336   __ j(less_equal, &Ljcc);
337   __ j(greater, &Ljcc);
338 
339   // 0xD9 instructions
340   __ nop();
341 
342   __ fld(1);
343   __ fld1();
344   __ fldz();
345   __ fldpi();
346   __ fabs();
347   __ fchs();
348   __ fprem();
349   __ fprem1();
350   __ fincstp();
351   __ ftst();
352   __ fxch(3);
353   __ fld_s(Operand(rbx, rcx, times_4, 10000));
354   __ fstp_s(Operand(rbx, rcx, times_4, 10000));
355   __ ffree(3);
356   __ fld_d(Operand(rbx, rcx, times_4, 10000));
357   __ fstp_d(Operand(rbx, rcx, times_4, 10000));
358   __ nop();
359 
360   __ fild_s(Operand(rbx, rcx, times_4, 10000));
361   __ fistp_s(Operand(rbx, rcx, times_4, 10000));
362   __ fild_d(Operand(rbx, rcx, times_4, 10000));
363   __ fistp_d(Operand(rbx, rcx, times_4, 10000));
364   __ fnstsw_ax();
365   __ nop();
366   __ fadd(3);
367   __ fsub(3);
368   __ fmul(3);
369   __ fdiv(3);
370 
371   __ faddp(3);
372   __ fsubp(3);
373   __ fmulp(3);
374   __ fdivp(3);
375   __ fcompp();
376   __ fwait();
377   __ frndint();
378   __ fninit();
379   __ nop();
380 
381   // SSE instruction
382   {
383     // Move operation
384     __ cvttss2si(rdx, Operand(rbx, rcx, times_4, 10000));
385     __ cvttss2si(rdx, xmm1);
386     __ cvtsd2ss(xmm0, xmm1);
387     __ cvtsd2ss(xmm0, Operand(rbx, rcx, times_4, 10000));
388     __ movaps(xmm0, xmm1);
389 
390     // logic operation
391     __ andps(xmm0, xmm1);
392     __ andps(xmm0, Operand(rbx, rcx, times_4, 10000));
393     __ orps(xmm0, xmm1);
394     __ orps(xmm0, Operand(rbx, rcx, times_4, 10000));
395     __ xorps(xmm0, xmm1);
396     __ xorps(xmm0, Operand(rbx, rcx, times_4, 10000));
397 
398     // Arithmetic operation
399     __ addss(xmm1, xmm0);
400     __ addss(xmm1, Operand(rbx, rcx, times_4, 10000));
401     __ mulss(xmm1, xmm0);
402     __ mulss(xmm1, Operand(rbx, rcx, times_4, 10000));
403     __ subss(xmm1, xmm0);
404     __ subss(xmm1, Operand(rbx, rcx, times_4, 10000));
405     __ divss(xmm1, xmm0);
406     __ divss(xmm1, Operand(rbx, rcx, times_4, 10000));
407     __ maxss(xmm1, xmm0);
408     __ maxss(xmm1, Operand(rbx, rcx, times_4, 10000));
409     __ minss(xmm1, xmm0);
410     __ minss(xmm1, Operand(rbx, rcx, times_4, 10000));
411     __ addps(xmm1, xmm0);
412     __ addps(xmm1, Operand(rbx, rcx, times_4, 10000));
413     __ subps(xmm1, xmm0);
414     __ subps(xmm1, Operand(rbx, rcx, times_4, 10000));
415     __ mulps(xmm1, xmm0);
416     __ mulps(xmm1, Operand(rbx, rcx, times_4, 10000));
417     __ divps(xmm1, xmm0);
418     __ divps(xmm1, Operand(rbx, rcx, times_4, 10000));
419 
420     __ ucomiss(xmm0, xmm1);
421     __ ucomiss(xmm0, Operand(rbx, rcx, times_4, 10000));
422   }
423   // SSE 2 instructions
424   {
425     __ cvttsd2si(rdx, Operand(rbx, rcx, times_4, 10000));
426     __ cvttsd2si(rdx, xmm1);
427     __ cvttsd2siq(rdx, xmm1);
428     __ cvttsd2siq(rdx, Operand(rbx, rcx, times_4, 10000));
429     __ cvtqsi2sd(xmm1, Operand(rbx, rcx, times_4, 10000));
430     __ cvtqsi2sd(xmm1, rdx);
431     __ movsd(xmm1, Operand(rbx, rcx, times_4, 10000));
432     __ movsd(Operand(rbx, rcx, times_4, 10000), xmm1);
433     // 128 bit move instructions.
434     __ movdqa(xmm0, Operand(rbx, rcx, times_4, 10000));
435     __ movdqa(Operand(rbx, rcx, times_4, 10000), xmm0);
436 
437     __ addsd(xmm1, xmm0);
438     __ addsd(xmm1, Operand(rbx, rcx, times_4, 10000));
439     __ mulsd(xmm1, xmm0);
440     __ mulsd(xmm1, Operand(rbx, rcx, times_4, 10000));
441     __ subsd(xmm1, xmm0);
442     __ subsd(xmm1, Operand(rbx, rcx, times_4, 10000));
443     __ divsd(xmm1, xmm0);
444     __ divsd(xmm1, Operand(rbx, rcx, times_4, 10000));
445     __ minsd(xmm1, xmm0);
446     __ minsd(xmm1, Operand(rbx, rcx, times_4, 10000));
447     __ maxsd(xmm1, xmm0);
448     __ maxsd(xmm1, Operand(rbx, rcx, times_4, 10000));
449     __ ucomisd(xmm0, xmm1);
450 
451     __ andpd(xmm0, xmm1);
452 
453     __ pslld(xmm0, 6);
454     __ psrld(xmm0, 6);
455     __ psllq(xmm0, 6);
456     __ psrlq(xmm0, 6);
457 
458     __ pcmpeqd(xmm1, xmm0);
459 
460     __ punpckldq(xmm1, xmm11);
461     __ punpckhdq(xmm8, xmm15);
462   }
463 
464   // cmov.
465   {
466     __ cmovq(overflow, rax, Operand(rax, 0));
467     __ cmovq(no_overflow, rax, Operand(rax, 1));
468     __ cmovq(below, rax, Operand(rax, 2));
469     __ cmovq(above_equal, rax, Operand(rax, 3));
470     __ cmovq(equal, rax, Operand(rbx, 0));
471     __ cmovq(not_equal, rax, Operand(rbx, 1));
472     __ cmovq(below_equal, rax, Operand(rbx, 2));
473     __ cmovq(above, rax, Operand(rbx, 3));
474     __ cmovq(sign, rax, Operand(rcx, 0));
475     __ cmovq(not_sign, rax, Operand(rcx, 1));
476     __ cmovq(parity_even, rax, Operand(rcx, 2));
477     __ cmovq(parity_odd, rax, Operand(rcx, 3));
478     __ cmovq(less, rax, Operand(rdx, 0));
479     __ cmovq(greater_equal, rax, Operand(rdx, 1));
480     __ cmovq(less_equal, rax, Operand(rdx, 2));
481     __ cmovq(greater, rax, Operand(rdx, 3));
482   }
483 
484   {
485     if (CpuFeatures::IsSupported(SSE4_1)) {
486       CpuFeatureScope scope(&assm, SSE4_1);
487       __ extractps(rax, xmm1, 0);
488       __ pextrd(rbx, xmm15, 0);
489       __ pextrd(r12, xmm0, 1);
490       __ pinsrd(xmm9, r9, 0);
491       __ pinsrd(xmm5, rax, 1);
492     }
493   }
494 
495   // AVX instruction
496   {
497     if (CpuFeatures::IsSupported(AVX)) {
498       CpuFeatureScope scope(&assm, AVX);
499       __ vmovss(xmm6, xmm14, xmm2);
500       __ vmovss(xmm9, Operand(rbx, rcx, times_4, 10000));
501       __ vmovss(Operand(rbx, rcx, times_4, 10000), xmm0);
502 
503       __ vaddss(xmm0, xmm1, xmm2);
504       __ vaddss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
505       __ vmulss(xmm0, xmm1, xmm2);
506       __ vmulss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
507       __ vsubss(xmm0, xmm1, xmm2);
508       __ vsubss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
509       __ vdivss(xmm0, xmm1, xmm2);
510       __ vdivss(xmm0, xmm1, Operand(rbx, rcx, times_2, 10000));
511       __ vminss(xmm8, xmm1, xmm2);
512       __ vminss(xmm9, xmm1, Operand(rbx, rcx, times_8, 10000));
513       __ vmaxss(xmm8, xmm1, xmm2);
514       __ vmaxss(xmm9, xmm1, Operand(rbx, rcx, times_1, 10000));
515       __ vmovss(xmm9, Operand(r11, rcx, times_8, -10000));
516       __ vmovss(Operand(rbx, r9, times_4, 10000), xmm1);
517       __ vucomiss(xmm9, xmm1);
518       __ vucomiss(xmm8, Operand(rbx, rdx, times_2, 10981));
519 
520       __ vmovd(xmm5, rdi);
521       __ vmovd(xmm9, Operand(rbx, rcx, times_4, 10000));
522       __ vmovd(r9, xmm6);
523       __ vmovq(xmm5, rdi);
524       __ vmovq(xmm9, Operand(rbx, rcx, times_4, 10000));
525       __ vmovq(r9, xmm6);
526 
527       __ vmovsd(xmm6, xmm14, xmm2);
528       __ vmovsd(xmm9, Operand(rbx, rcx, times_4, 10000));
529       __ vmovsd(Operand(rbx, rcx, times_4, 10000), xmm0);
530 
531       __ vaddsd(xmm0, xmm1, xmm2);
532       __ vaddsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
533       __ vmulsd(xmm0, xmm1, xmm2);
534       __ vmulsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
535       __ vsubsd(xmm0, xmm1, xmm2);
536       __ vsubsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
537       __ vdivsd(xmm0, xmm1, xmm2);
538       __ vdivsd(xmm0, xmm1, Operand(rbx, rcx, times_2, 10000));
539       __ vminsd(xmm8, xmm1, xmm2);
540       __ vminsd(xmm9, xmm1, Operand(rbx, rcx, times_8, 10000));
541       __ vmaxsd(xmm8, xmm1, xmm2);
542       __ vmaxsd(xmm9, xmm1, Operand(rbx, rcx, times_1, 10000));
543       __ vroundsd(xmm8, xmm3, xmm0, kRoundDown);
544       __ vsqrtsd(xmm8, xmm1, xmm2);
545       __ vsqrtsd(xmm9, xmm1, Operand(rbx, rcx, times_1, 10000));
546       __ vucomisd(xmm9, xmm1);
547       __ vucomisd(xmm8, Operand(rbx, rdx, times_2, 10981));
548 
549       __ vcvtss2sd(xmm4, xmm9, xmm11);
550       __ vcvtsd2ss(xmm9, xmm3, xmm2);
551       __ vcvtss2sd(xmm4, xmm9, Operand(rbx, rcx, times_1, 10000));
552       __ vcvtsd2ss(xmm9, xmm3, Operand(rbx, rcx, times_1, 10000));
553       __ vcvtlsi2sd(xmm5, xmm9, rcx);
554       __ vcvtlsi2sd(xmm9, xmm3, Operand(rbx, r9, times_4, 10000));
555       __ vcvtqsi2sd(xmm5, xmm9, r11);
556       __ vcvttsd2si(r9, xmm6);
557       __ vcvttsd2si(rax, Operand(rbx, r9, times_4, 10000));
558       __ vcvttsd2siq(rdi, xmm9);
559       __ vcvttsd2siq(r8, Operand(r9, rbx, times_4, 10000));
560       __ vcvtsd2si(rdi, xmm9);
561 
562       __ vmovaps(xmm10, xmm11);
563       __ vmovapd(xmm7, xmm0);
564       __ vmovmskpd(r9, xmm4);
565 
566       __ vandps(xmm0, xmm9, xmm2);
567       __ vandps(xmm9, xmm1, Operand(rbx, rcx, times_4, 10000));
568       __ vxorps(xmm0, xmm1, xmm9);
569       __ vxorps(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
570 
571       __ vandpd(xmm0, xmm9, xmm2);
572       __ vandpd(xmm9, xmm1, Operand(rbx, rcx, times_4, 10000));
573       __ vorpd(xmm0, xmm1, xmm9);
574       __ vorpd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
575       __ vxorpd(xmm0, xmm1, xmm9);
576       __ vxorpd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
577 
578       __ vpcmpeqd(xmm0, xmm15, xmm5);
579       __ vpcmpeqd(xmm15, xmm0, Operand(rbx, rcx, times_4, 10000));
580       __ vpsllq(xmm0, xmm15, 21);
581       __ vpsrlq(xmm15, xmm0, 21);
582     }
583   }
584 
585   // FMA3 instruction
586   {
587     if (CpuFeatures::IsSupported(FMA3)) {
588       CpuFeatureScope scope(&assm, FMA3);
589       __ vfmadd132sd(xmm0, xmm1, xmm2);
590       __ vfmadd132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
591       __ vfmadd213sd(xmm0, xmm1, xmm2);
592       __ vfmadd213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
593       __ vfmadd231sd(xmm0, xmm1, xmm2);
594       __ vfmadd231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
595 
596       __ vfmadd132sd(xmm9, xmm10, xmm11);
597       __ vfmadd132sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
598       __ vfmadd213sd(xmm9, xmm10, xmm11);
599       __ vfmadd213sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
600       __ vfmadd231sd(xmm9, xmm10, xmm11);
601       __ vfmadd231sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
602 
603       __ vfmsub132sd(xmm0, xmm1, xmm2);
604       __ vfmsub132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
605       __ vfmsub213sd(xmm0, xmm1, xmm2);
606       __ vfmsub213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
607       __ vfmsub231sd(xmm0, xmm1, xmm2);
608       __ vfmsub231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
609 
610       __ vfnmadd132sd(xmm0, xmm1, xmm2);
611       __ vfnmadd132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
612       __ vfnmadd213sd(xmm0, xmm1, xmm2);
613       __ vfnmadd213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
614       __ vfnmadd231sd(xmm0, xmm1, xmm2);
615       __ vfnmadd231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
616 
617       __ vfnmsub132sd(xmm0, xmm1, xmm2);
618       __ vfnmsub132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
619       __ vfnmsub213sd(xmm0, xmm1, xmm2);
620       __ vfnmsub213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
621       __ vfnmsub231sd(xmm0, xmm1, xmm2);
622       __ vfnmsub231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
623 
624       __ vfmadd132ss(xmm0, xmm1, xmm2);
625       __ vfmadd132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
626       __ vfmadd213ss(xmm0, xmm1, xmm2);
627       __ vfmadd213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
628       __ vfmadd231ss(xmm0, xmm1, xmm2);
629       __ vfmadd231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
630 
631       __ vfmsub132ss(xmm0, xmm1, xmm2);
632       __ vfmsub132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
633       __ vfmsub213ss(xmm0, xmm1, xmm2);
634       __ vfmsub213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
635       __ vfmsub231ss(xmm0, xmm1, xmm2);
636       __ vfmsub231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
637 
638       __ vfnmadd132ss(xmm0, xmm1, xmm2);
639       __ vfnmadd132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
640       __ vfnmadd213ss(xmm0, xmm1, xmm2);
641       __ vfnmadd213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
642       __ vfnmadd231ss(xmm0, xmm1, xmm2);
643       __ vfnmadd231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
644 
645       __ vfnmsub132ss(xmm0, xmm1, xmm2);
646       __ vfnmsub132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
647       __ vfnmsub213ss(xmm0, xmm1, xmm2);
648       __ vfnmsub213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
649       __ vfnmsub231ss(xmm0, xmm1, xmm2);
650       __ vfnmsub231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
651     }
652   }
653 
654   // BMI1 instructions
655   {
656     if (CpuFeatures::IsSupported(BMI1)) {
657       CpuFeatureScope scope(&assm, BMI1);
658       __ andnq(rax, rbx, rcx);
659       __ andnq(rax, rbx, Operand(rbx, rcx, times_4, 10000));
660       __ andnl(rax, rbx, rcx);
661       __ andnl(rax, rbx, Operand(rbx, rcx, times_4, 10000));
662       __ bextrq(rax, rbx, rcx);
663       __ bextrq(rax, Operand(rbx, rcx, times_4, 10000), rbx);
664       __ bextrl(rax, rbx, rcx);
665       __ bextrl(rax, Operand(rbx, rcx, times_4, 10000), rbx);
666       __ blsiq(rax, rbx);
667       __ blsiq(rax, Operand(rbx, rcx, times_4, 10000));
668       __ blsil(rax, rbx);
669       __ blsil(rax, Operand(rbx, rcx, times_4, 10000));
670       __ blsmskq(rax, rbx);
671       __ blsmskq(rax, Operand(rbx, rcx, times_4, 10000));
672       __ blsmskl(rax, rbx);
673       __ blsmskl(rax, Operand(rbx, rcx, times_4, 10000));
674       __ blsrq(rax, rbx);
675       __ blsrq(rax, Operand(rbx, rcx, times_4, 10000));
676       __ blsrl(rax, rbx);
677       __ blsrl(rax, Operand(rbx, rcx, times_4, 10000));
678       __ tzcntq(rax, rbx);
679       __ tzcntq(rax, Operand(rbx, rcx, times_4, 10000));
680       __ tzcntl(rax, rbx);
681       __ tzcntl(rax, Operand(rbx, rcx, times_4, 10000));
682     }
683   }
684 
685   // LZCNT instructions
686   {
687     if (CpuFeatures::IsSupported(LZCNT)) {
688       CpuFeatureScope scope(&assm, LZCNT);
689       __ lzcntq(rax, rbx);
690       __ lzcntq(rax, Operand(rbx, rcx, times_4, 10000));
691       __ lzcntl(rax, rbx);
692       __ lzcntl(rax, Operand(rbx, rcx, times_4, 10000));
693     }
694   }
695 
696   // POPCNT instructions
697   {
698     if (CpuFeatures::IsSupported(POPCNT)) {
699       CpuFeatureScope scope(&assm, POPCNT);
700       __ popcntq(rax, rbx);
701       __ popcntq(rax, Operand(rbx, rcx, times_4, 10000));
702       __ popcntl(rax, rbx);
703       __ popcntl(rax, Operand(rbx, rcx, times_4, 10000));
704     }
705   }
706 
707   // BMI2 instructions
708   {
709     if (CpuFeatures::IsSupported(BMI2)) {
710       CpuFeatureScope scope(&assm, BMI2);
711       __ bzhiq(rax, rbx, rcx);
712       __ bzhiq(rax, Operand(rbx, rcx, times_4, 10000), rbx);
713       __ bzhil(rax, rbx, rcx);
714       __ bzhil(rax, Operand(rbx, rcx, times_4, 10000), rbx);
715       __ mulxq(rax, rbx, rcx);
716       __ mulxq(rax, rbx, Operand(rbx, rcx, times_4, 10000));
717       __ mulxl(rax, rbx, rcx);
718       __ mulxl(rax, rbx, Operand(rbx, rcx, times_4, 10000));
719       __ pdepq(rax, rbx, rcx);
720       __ pdepq(rax, rbx, Operand(rbx, rcx, times_4, 10000));
721       __ pdepl(rax, rbx, rcx);
722       __ pdepl(rax, rbx, Operand(rbx, rcx, times_4, 10000));
723       __ pextq(rax, rbx, rcx);
724       __ pextq(rax, rbx, Operand(rbx, rcx, times_4, 10000));
725       __ pextl(rax, rbx, rcx);
726       __ pextl(rax, rbx, Operand(rbx, rcx, times_4, 10000));
727       __ sarxq(rax, rbx, rcx);
728       __ sarxq(rax, Operand(rbx, rcx, times_4, 10000), rbx);
729       __ sarxl(rax, rbx, rcx);
730       __ sarxl(rax, Operand(rbx, rcx, times_4, 10000), rbx);
731       __ shlxq(rax, rbx, rcx);
732       __ shlxq(rax, Operand(rbx, rcx, times_4, 10000), rbx);
733       __ shlxl(rax, rbx, rcx);
734       __ shlxl(rax, Operand(rbx, rcx, times_4, 10000), rbx);
735       __ shrxq(rax, rbx, rcx);
736       __ shrxq(rax, Operand(rbx, rcx, times_4, 10000), rbx);
737       __ shrxl(rax, rbx, rcx);
738       __ shrxl(rax, Operand(rbx, rcx, times_4, 10000), rbx);
739       __ rorxq(rax, rbx, 63);
740       __ rorxq(rax, Operand(rbx, rcx, times_4, 10000), 63);
741       __ rorxl(rax, rbx, 31);
742       __ rorxl(rax, Operand(rbx, rcx, times_4, 10000), 31);
743     }
744   }
745 
746   // xchg.
747   {
748     __ xchgq(rax, rax);
749     __ xchgq(rax, rbx);
750     __ xchgq(rbx, rbx);
751     __ xchgq(rbx, Operand(rsp, 12));
752   }
753 
754   // Nop instructions
755   for (int i = 0; i < 16; i++) {
756     __ Nop(i);
757   }
758 
759   __ ret(0);
760 
761   CodeDesc desc;
762   assm.GetCode(&desc);
763   Handle<Code> code = isolate->factory()->NewCode(
764       desc, Code::ComputeFlags(Code::STUB), Handle<Code>());
765   USE(code);
766 #ifdef OBJECT_PRINT
767   OFStream os(stdout);
768   code->Print(os);
769   byte* begin = code->instruction_start();
770   byte* end = begin + code->instruction_size();
771   disasm::Disassembler::Disassemble(stdout, begin, end);
772 #endif
773 }
774 
775 #undef __
776