99f8d57f3c
Basically recognize certain x < y ? x : y constructs and turn that into Float64Min/Float64Max operations, if the target machine supports that. On x86 we lower to (v)minsd/(v)maxsd. R=dcarney@chromium.org Review URL: https://codereview.chromium.org/998283002 Cr-Commit-Position: refs/heads/master@{#27160}
606 lines
19 KiB
C++
606 lines
19 KiB
C++
// Copyright 2011 the V8 project authors. All rights reserved.
|
|
// Redistribution and use in source and binary forms, with or without
|
|
// modification, are permitted provided that the following conditions are
|
|
// met:
|
|
//
|
|
// * Redistributions of source code must retain the above copyright
|
|
// notice, this list of conditions and the following disclaimer.
|
|
// * Redistributions in binary form must reproduce the above
|
|
// copyright notice, this list of conditions and the following
|
|
// disclaimer in the documentation and/or other materials provided
|
|
// with the distribution.
|
|
// * Neither the name of Google Inc. nor the names of its
|
|
// contributors may be used to endorse or promote products derived
|
|
// from this software without specific prior written permission.
|
|
//
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include "src/v8.h"
|
|
|
|
#include "src/debug.h"
|
|
#include "src/disasm.h"
|
|
#include "src/disassembler.h"
|
|
#include "src/ic/ic.h"
|
|
#include "src/macro-assembler.h"
|
|
#include "src/serialize.h"
|
|
#include "test/cctest/cctest.h"
|
|
|
|
using namespace v8::internal;
|
|
|
|
|
|
#define __ assm.
|
|
|
|
|
|
static void DummyStaticFunction(Object* result) {
|
|
}
|
|
|
|
|
|
TEST(DisasmX64) {
|
|
CcTest::InitializeVM();
|
|
Isolate* isolate = CcTest::i_isolate();
|
|
HandleScope scope(isolate);
|
|
v8::internal::byte buffer[4096];
|
|
Assembler assm(isolate, buffer, sizeof buffer);
|
|
DummyStaticFunction(NULL); // just bloody use it (DELETE; debugging)
|
|
|
|
// Short immediate instructions
|
|
__ addq(rax, Immediate(12345678));
|
|
__ orq(rax, Immediate(12345678));
|
|
__ subq(rax, Immediate(12345678));
|
|
__ xorq(rax, Immediate(12345678));
|
|
__ andq(rax, Immediate(12345678));
|
|
|
|
// ---- This one caused crash
|
|
__ movq(rbx, Operand(rsp, rcx, times_2, 0)); // [rsp+rcx*4]
|
|
|
|
// ---- All instructions that I can think of
|
|
__ addq(rdx, rbx);
|
|
__ addq(rdx, Operand(rbx, 0));
|
|
__ addq(rdx, Operand(rbx, 16));
|
|
__ addq(rdx, Operand(rbx, 1999));
|
|
__ addq(rdx, Operand(rbx, -4));
|
|
__ addq(rdx, Operand(rbx, -1999));
|
|
__ addq(rdx, Operand(rsp, 0));
|
|
__ addq(rdx, Operand(rsp, 16));
|
|
__ addq(rdx, Operand(rsp, 1999));
|
|
__ addq(rdx, Operand(rsp, -4));
|
|
__ addq(rdx, Operand(rsp, -1999));
|
|
__ nop();
|
|
__ addq(rsi, Operand(rcx, times_4, 0));
|
|
__ addq(rsi, Operand(rcx, times_4, 24));
|
|
__ addq(rsi, Operand(rcx, times_4, -4));
|
|
__ addq(rsi, Operand(rcx, times_4, -1999));
|
|
__ nop();
|
|
__ addq(rdi, Operand(rbp, rcx, times_4, 0));
|
|
__ addq(rdi, Operand(rbp, rcx, times_4, 12));
|
|
__ addq(rdi, Operand(rbp, rcx, times_4, -8));
|
|
__ addq(rdi, Operand(rbp, rcx, times_4, -3999));
|
|
__ addq(Operand(rbp, rcx, times_4, 12), Immediate(12));
|
|
|
|
__ nop();
|
|
__ addq(rbx, Immediate(12));
|
|
__ nop();
|
|
__ nop();
|
|
__ andq(rdx, Immediate(3));
|
|
__ andq(rdx, Operand(rsp, 4));
|
|
__ cmpq(rdx, Immediate(3));
|
|
__ cmpq(rdx, Operand(rsp, 4));
|
|
__ cmpq(Operand(rbp, rcx, times_4, 0), Immediate(1000));
|
|
__ cmpb(rbx, Operand(rbp, rcx, times_2, 0));
|
|
__ cmpb(Operand(rbp, rcx, times_2, 0), rbx);
|
|
__ orq(rdx, Immediate(3));
|
|
__ xorq(rdx, Immediate(3));
|
|
__ nop();
|
|
__ cpuid();
|
|
__ movsxbl(rdx, Operand(rcx, 0));
|
|
__ movsxbq(rdx, Operand(rcx, 0));
|
|
__ movsxwl(rdx, Operand(rcx, 0));
|
|
__ movsxwq(rdx, Operand(rcx, 0));
|
|
__ movzxbl(rdx, Operand(rcx, 0));
|
|
__ movzxwl(rdx, Operand(rcx, 0));
|
|
__ movzxbq(rdx, Operand(rcx, 0));
|
|
__ movzxwq(rdx, Operand(rcx, 0));
|
|
|
|
__ nop();
|
|
__ imulq(rdx, rcx);
|
|
__ shld(rdx, rcx);
|
|
__ shrd(rdx, rcx);
|
|
__ shlq(Operand(rdi, rax, times_4, 100), Immediate(1));
|
|
__ shlq(Operand(rdi, rax, times_4, 100), Immediate(6));
|
|
__ shlq(Operand(r15, 0), Immediate(1));
|
|
__ shlq(Operand(r15, 0), Immediate(6));
|
|
__ shlq_cl(Operand(r15, 0));
|
|
__ shlq_cl(Operand(r15, 0));
|
|
__ shlq_cl(Operand(rdi, rax, times_4, 100));
|
|
__ shlq_cl(Operand(rdi, rax, times_4, 100));
|
|
__ shlq(rdx, Immediate(1));
|
|
__ shlq(rdx, Immediate(6));
|
|
__ shll(Operand(rdi, rax, times_4, 100), Immediate(1));
|
|
__ shll(Operand(rdi, rax, times_4, 100), Immediate(6));
|
|
__ shll(Operand(r15, 0), Immediate(1));
|
|
__ shll(Operand(r15, 0), Immediate(6));
|
|
__ shll_cl(Operand(r15, 0));
|
|
__ shll_cl(Operand(r15, 0));
|
|
__ shll_cl(Operand(rdi, rax, times_4, 100));
|
|
__ shll_cl(Operand(rdi, rax, times_4, 100));
|
|
__ shll(rdx, Immediate(1));
|
|
__ shll(rdx, Immediate(6));
|
|
__ bts(Operand(rdx, 0), rcx);
|
|
__ bts(Operand(rbx, rcx, times_4, 0), rcx);
|
|
__ nop();
|
|
__ pushq(Immediate(12));
|
|
__ pushq(Immediate(23456));
|
|
__ pushq(rcx);
|
|
__ pushq(rsi);
|
|
__ pushq(Operand(rbp, JavaScriptFrameConstants::kFunctionOffset));
|
|
__ pushq(Operand(rbx, rcx, times_4, 0));
|
|
__ pushq(Operand(rbx, rcx, times_4, 0));
|
|
__ pushq(Operand(rbx, rcx, times_4, 10000));
|
|
__ popq(rdx);
|
|
__ popq(rax);
|
|
__ popq(Operand(rbx, rcx, times_4, 0));
|
|
__ nop();
|
|
|
|
__ addq(rdx, Operand(rsp, 16));
|
|
__ addq(rdx, rcx);
|
|
__ movb(rdx, Operand(rcx, 0));
|
|
__ movb(rcx, Immediate(6));
|
|
__ movb(Operand(rsp, 16), rdx);
|
|
__ movw(Operand(rsp, 16), rdx);
|
|
__ nop();
|
|
__ movsxwq(rdx, Operand(rsp, 12));
|
|
__ movsxbq(rdx, Operand(rsp, 12));
|
|
__ movsxlq(rdx, Operand(rsp, 12));
|
|
__ movzxwq(rdx, Operand(rsp, 12));
|
|
__ movzxbq(rdx, Operand(rsp, 12));
|
|
__ nop();
|
|
__ movq(rdx, Immediate(1234567));
|
|
__ movq(rdx, Operand(rsp, 12));
|
|
__ movq(Operand(rbx, rcx, times_4, 10000), Immediate(12345));
|
|
__ movq(Operand(rbx, rcx, times_4, 10000), rdx);
|
|
__ nop();
|
|
__ decb(rdx);
|
|
__ decb(Operand(rax, 10));
|
|
__ decb(Operand(rbx, rcx, times_4, 10000));
|
|
__ decq(rdx);
|
|
__ cdq();
|
|
|
|
__ nop();
|
|
__ idivq(rdx);
|
|
__ mull(rdx);
|
|
__ mulq(rdx);
|
|
__ negq(rdx);
|
|
__ notq(rdx);
|
|
__ testq(Operand(rbx, rcx, times_4, 10000), rdx);
|
|
|
|
__ imulq(rdx, rcx, Immediate(12));
|
|
__ imulq(rdx, rcx, Immediate(1000));
|
|
__ imulq(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ imulq(rdx, Operand(rbx, rcx, times_4, 10000), Immediate(12));
|
|
__ imulq(rdx, Operand(rbx, rcx, times_4, 10000), Immediate(1000));
|
|
__ imull(r15, rcx, Immediate(12));
|
|
__ imull(r15, rcx, Immediate(1000));
|
|
__ imull(r15, Operand(rbx, rcx, times_4, 10000));
|
|
__ imull(r15, Operand(rbx, rcx, times_4, 10000), Immediate(12));
|
|
__ imull(r15, Operand(rbx, rcx, times_4, 10000), Immediate(1000));
|
|
|
|
__ incq(rdx);
|
|
__ incq(Operand(rbx, rcx, times_4, 10000));
|
|
__ pushq(Operand(rbx, rcx, times_4, 10000));
|
|
__ popq(Operand(rbx, rcx, times_4, 10000));
|
|
// TODO(mstarzinger): The following is protected.
|
|
// __ jmp(Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ leaq(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ orq(rdx, Immediate(12345));
|
|
__ orq(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ nop();
|
|
|
|
__ rclq(rdx, Immediate(1));
|
|
__ rclq(rdx, Immediate(7));
|
|
__ rcrq(rdx, Immediate(1));
|
|
__ rcrq(rdx, Immediate(7));
|
|
__ sarq(rdx, Immediate(1));
|
|
__ sarq(rdx, Immediate(6));
|
|
__ sarq_cl(rdx);
|
|
__ sbbq(rdx, rbx);
|
|
__ shld(rdx, rbx);
|
|
__ shlq(rdx, Immediate(1));
|
|
__ shlq(rdx, Immediate(6));
|
|
__ shlq_cl(rdx);
|
|
__ shrd(rdx, rbx);
|
|
__ shrq(rdx, Immediate(1));
|
|
__ shrq(rdx, Immediate(7));
|
|
__ shrq_cl(rdx);
|
|
|
|
|
|
// Immediates
|
|
|
|
__ addq(rbx, Immediate(12));
|
|
__ addq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
|
|
|
|
__ andq(rbx, Immediate(12345));
|
|
|
|
__ cmpq(rbx, Immediate(12345));
|
|
__ cmpq(rbx, Immediate(12));
|
|
__ cmpq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
|
|
__ cmpb(rax, Immediate(100));
|
|
|
|
__ orq(rbx, Immediate(12345));
|
|
|
|
__ subq(rbx, Immediate(12));
|
|
__ subq(Operand(rdx, rcx, times_4, 10000), Immediate(12));
|
|
|
|
__ xorq(rbx, Immediate(12345));
|
|
|
|
__ imulq(rdx, rcx, Immediate(12));
|
|
__ imulq(rdx, rcx, Immediate(1000));
|
|
|
|
__ cld();
|
|
|
|
__ subq(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ subq(rdx, rbx);
|
|
|
|
__ testq(rdx, Immediate(12345));
|
|
__ testq(Operand(rbx, rcx, times_8, 10000), rdx);
|
|
__ testb(Operand(rcx, rbx, times_2, 1000), rdx);
|
|
__ testb(Operand(rax, -20), Immediate(0x9A));
|
|
__ nop();
|
|
|
|
__ xorq(rdx, Immediate(12345));
|
|
__ xorq(rdx, Operand(rbx, rcx, times_8, 10000));
|
|
__ bts(Operand(rbx, rcx, times_8, 10000), rdx);
|
|
__ hlt();
|
|
__ int3();
|
|
__ ret(0);
|
|
__ ret(8);
|
|
|
|
// Calls
|
|
|
|
Label L1, L2;
|
|
__ bind(&L1);
|
|
__ nop();
|
|
__ call(&L1);
|
|
__ call(&L2);
|
|
__ nop();
|
|
__ bind(&L2);
|
|
// TODO(mstarzinger): The following is protected.
|
|
// __ call(Operand(rbx, rcx, times_4, 10000));
|
|
__ nop();
|
|
Handle<Code> ic(LoadIC::initialize_stub(isolate, NOT_CONTEXTUAL));
|
|
__ call(ic, RelocInfo::CODE_TARGET);
|
|
__ nop();
|
|
__ nop();
|
|
|
|
__ jmp(&L1);
|
|
// TODO(mstarzinger): The following is protected.
|
|
// __ jmp(Operand(rbx, rcx, times_4, 10000));
|
|
ExternalReference after_break_target =
|
|
ExternalReference::debug_after_break_target_address(isolate);
|
|
USE(after_break_target);
|
|
__ jmp(ic, RelocInfo::CODE_TARGET);
|
|
__ nop();
|
|
|
|
|
|
Label Ljcc;
|
|
__ nop();
|
|
// long jumps
|
|
__ j(overflow, &Ljcc);
|
|
__ j(no_overflow, &Ljcc);
|
|
__ j(below, &Ljcc);
|
|
__ j(above_equal, &Ljcc);
|
|
__ j(equal, &Ljcc);
|
|
__ j(not_equal, &Ljcc);
|
|
__ j(below_equal, &Ljcc);
|
|
__ j(above, &Ljcc);
|
|
__ j(sign, &Ljcc);
|
|
__ j(not_sign, &Ljcc);
|
|
__ j(parity_even, &Ljcc);
|
|
__ j(parity_odd, &Ljcc);
|
|
__ j(less, &Ljcc);
|
|
__ j(greater_equal, &Ljcc);
|
|
__ j(less_equal, &Ljcc);
|
|
__ j(greater, &Ljcc);
|
|
__ nop();
|
|
__ bind(&Ljcc);
|
|
// short jumps
|
|
__ j(overflow, &Ljcc);
|
|
__ j(no_overflow, &Ljcc);
|
|
__ j(below, &Ljcc);
|
|
__ j(above_equal, &Ljcc);
|
|
__ j(equal, &Ljcc);
|
|
__ j(not_equal, &Ljcc);
|
|
__ j(below_equal, &Ljcc);
|
|
__ j(above, &Ljcc);
|
|
__ j(sign, &Ljcc);
|
|
__ j(not_sign, &Ljcc);
|
|
__ j(parity_even, &Ljcc);
|
|
__ j(parity_odd, &Ljcc);
|
|
__ j(less, &Ljcc);
|
|
__ j(greater_equal, &Ljcc);
|
|
__ j(less_equal, &Ljcc);
|
|
__ j(greater, &Ljcc);
|
|
|
|
// 0xD9 instructions
|
|
__ nop();
|
|
|
|
__ fld(1);
|
|
__ fld1();
|
|
__ fldz();
|
|
__ fldpi();
|
|
__ fabs();
|
|
__ fchs();
|
|
__ fprem();
|
|
__ fprem1();
|
|
__ fincstp();
|
|
__ ftst();
|
|
__ fxch(3);
|
|
__ fld_s(Operand(rbx, rcx, times_4, 10000));
|
|
__ fstp_s(Operand(rbx, rcx, times_4, 10000));
|
|
__ ffree(3);
|
|
__ fld_d(Operand(rbx, rcx, times_4, 10000));
|
|
__ fstp_d(Operand(rbx, rcx, times_4, 10000));
|
|
__ nop();
|
|
|
|
__ fild_s(Operand(rbx, rcx, times_4, 10000));
|
|
__ fistp_s(Operand(rbx, rcx, times_4, 10000));
|
|
__ fild_d(Operand(rbx, rcx, times_4, 10000));
|
|
__ fistp_d(Operand(rbx, rcx, times_4, 10000));
|
|
__ fnstsw_ax();
|
|
__ nop();
|
|
__ fadd(3);
|
|
__ fsub(3);
|
|
__ fmul(3);
|
|
__ fdiv(3);
|
|
|
|
__ faddp(3);
|
|
__ fsubp(3);
|
|
__ fmulp(3);
|
|
__ fdivp(3);
|
|
__ fcompp();
|
|
__ fwait();
|
|
__ frndint();
|
|
__ fninit();
|
|
__ nop();
|
|
|
|
// SSE instruction
|
|
{
|
|
// Move operation
|
|
__ cvttss2si(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ cvttss2si(rdx, xmm1);
|
|
__ cvtsd2ss(xmm0, xmm1);
|
|
__ cvtsd2ss(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
__ movaps(xmm0, xmm1);
|
|
|
|
// logic operation
|
|
__ andps(xmm0, xmm1);
|
|
__ andps(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
__ orps(xmm0, xmm1);
|
|
__ orps(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
__ xorps(xmm0, xmm1);
|
|
__ xorps(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
// Arithmetic operation
|
|
__ addss(xmm1, xmm0);
|
|
__ addss(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ mulss(xmm1, xmm0);
|
|
__ mulss(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ subss(xmm1, xmm0);
|
|
__ subss(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ divss(xmm1, xmm0);
|
|
__ divss(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ addps(xmm1, xmm0);
|
|
__ addps(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ subps(xmm1, xmm0);
|
|
__ subps(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ mulps(xmm1, xmm0);
|
|
__ mulps(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ divps(xmm1, xmm0);
|
|
__ divps(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ ucomiss(xmm0, xmm1);
|
|
__ ucomiss(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
}
|
|
// SSE 2 instructions
|
|
{
|
|
__ cvttsd2si(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ cvttsd2si(rdx, xmm1);
|
|
__ cvttsd2siq(rdx, xmm1);
|
|
__ cvttsd2siq(rdx, Operand(rbx, rcx, times_4, 10000));
|
|
__ cvtqsi2sd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ cvtqsi2sd(xmm1, rdx);
|
|
__ movsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ movsd(Operand(rbx, rcx, times_4, 10000), xmm1);
|
|
// 128 bit move instructions.
|
|
__ movdqa(xmm0, Operand(rbx, rcx, times_4, 10000));
|
|
__ movdqa(Operand(rbx, rcx, times_4, 10000), xmm0);
|
|
|
|
__ addsd(xmm1, xmm0);
|
|
__ addsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ mulsd(xmm1, xmm0);
|
|
__ mulsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ subsd(xmm1, xmm0);
|
|
__ subsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ divsd(xmm1, xmm0);
|
|
__ divsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ minsd(xmm1, xmm0);
|
|
__ minsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ maxsd(xmm1, xmm0);
|
|
__ maxsd(xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ ucomisd(xmm0, xmm1);
|
|
|
|
__ andpd(xmm0, xmm1);
|
|
|
|
__ pslld(xmm0, 6);
|
|
__ psrld(xmm0, 6);
|
|
__ psllq(xmm0, 6);
|
|
__ psrlq(xmm0, 6);
|
|
|
|
__ pcmpeqd(xmm1, xmm0);
|
|
|
|
__ punpckldq(xmm1, xmm11);
|
|
__ punpckhdq(xmm8, xmm15);
|
|
}
|
|
|
|
// cmov.
|
|
{
|
|
__ cmovq(overflow, rax, Operand(rax, 0));
|
|
__ cmovq(no_overflow, rax, Operand(rax, 1));
|
|
__ cmovq(below, rax, Operand(rax, 2));
|
|
__ cmovq(above_equal, rax, Operand(rax, 3));
|
|
__ cmovq(equal, rax, Operand(rbx, 0));
|
|
__ cmovq(not_equal, rax, Operand(rbx, 1));
|
|
__ cmovq(below_equal, rax, Operand(rbx, 2));
|
|
__ cmovq(above, rax, Operand(rbx, 3));
|
|
__ cmovq(sign, rax, Operand(rcx, 0));
|
|
__ cmovq(not_sign, rax, Operand(rcx, 1));
|
|
__ cmovq(parity_even, rax, Operand(rcx, 2));
|
|
__ cmovq(parity_odd, rax, Operand(rcx, 3));
|
|
__ cmovq(less, rax, Operand(rdx, 0));
|
|
__ cmovq(greater_equal, rax, Operand(rdx, 1));
|
|
__ cmovq(less_equal, rax, Operand(rdx, 2));
|
|
__ cmovq(greater, rax, Operand(rdx, 3));
|
|
}
|
|
|
|
{
|
|
if (CpuFeatures::IsSupported(SSE4_1)) {
|
|
CpuFeatureScope scope(&assm, SSE4_1);
|
|
__ extractps(rax, xmm1, 0);
|
|
__ pextrd(rbx, xmm15, 0);
|
|
__ pextrd(r12, xmm0, 1);
|
|
__ pinsrd(xmm9, r9, 0);
|
|
__ pinsrd(xmm5, rax, 1);
|
|
}
|
|
}
|
|
|
|
// AVX instruction
|
|
{
|
|
if (CpuFeatures::IsSupported(AVX)) {
|
|
CpuFeatureScope scope(&assm, AVX);
|
|
__ vaddsd(xmm0, xmm1, xmm2);
|
|
__ vaddsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vmulsd(xmm0, xmm1, xmm2);
|
|
__ vmulsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vsubsd(xmm0, xmm1, xmm2);
|
|
__ vsubsd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vdivsd(xmm0, xmm1, xmm2);
|
|
__ vdivsd(xmm0, xmm1, Operand(rbx, rcx, times_2, 10000));
|
|
__ vminsd(xmm8, xmm1, xmm2);
|
|
__ vminsd(xmm9, xmm1, Operand(rbx, rcx, times_8, 10000));
|
|
__ vmaxsd(xmm8, xmm1, xmm2);
|
|
__ vmaxsd(xmm9, xmm1, Operand(rbx, rcx, times_1, 10000));
|
|
}
|
|
}
|
|
|
|
// FMA3 instruction
|
|
{
|
|
if (CpuFeatures::IsSupported(FMA3)) {
|
|
CpuFeatureScope scope(&assm, FMA3);
|
|
__ vfmadd132sd(xmm0, xmm1, xmm2);
|
|
__ vfmadd132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmadd213sd(xmm0, xmm1, xmm2);
|
|
__ vfmadd213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmadd231sd(xmm0, xmm1, xmm2);
|
|
__ vfmadd231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfmadd132sd(xmm9, xmm10, xmm11);
|
|
__ vfmadd132sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
|
|
__ vfmadd213sd(xmm9, xmm10, xmm11);
|
|
__ vfmadd213sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
|
|
__ vfmadd231sd(xmm9, xmm10, xmm11);
|
|
__ vfmadd231sd(xmm9, xmm10, Operand(r9, r11, times_4, 10000));
|
|
|
|
__ vfmsub132sd(xmm0, xmm1, xmm2);
|
|
__ vfmsub132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmsub213sd(xmm0, xmm1, xmm2);
|
|
__ vfmsub213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmsub231sd(xmm0, xmm1, xmm2);
|
|
__ vfmsub231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfnmadd132sd(xmm0, xmm1, xmm2);
|
|
__ vfnmadd132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmadd213sd(xmm0, xmm1, xmm2);
|
|
__ vfnmadd213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmadd231sd(xmm0, xmm1, xmm2);
|
|
__ vfnmadd231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfnmsub132sd(xmm0, xmm1, xmm2);
|
|
__ vfnmsub132sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmsub213sd(xmm0, xmm1, xmm2);
|
|
__ vfnmsub213sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmsub231sd(xmm0, xmm1, xmm2);
|
|
__ vfnmsub231sd(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfmadd132ss(xmm0, xmm1, xmm2);
|
|
__ vfmadd132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmadd213ss(xmm0, xmm1, xmm2);
|
|
__ vfmadd213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmadd231ss(xmm0, xmm1, xmm2);
|
|
__ vfmadd231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfmsub132ss(xmm0, xmm1, xmm2);
|
|
__ vfmsub132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmsub213ss(xmm0, xmm1, xmm2);
|
|
__ vfmsub213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfmsub231ss(xmm0, xmm1, xmm2);
|
|
__ vfmsub231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfnmadd132ss(xmm0, xmm1, xmm2);
|
|
__ vfnmadd132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmadd213ss(xmm0, xmm1, xmm2);
|
|
__ vfnmadd213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmadd231ss(xmm0, xmm1, xmm2);
|
|
__ vfnmadd231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
|
|
__ vfnmsub132ss(xmm0, xmm1, xmm2);
|
|
__ vfnmsub132ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmsub213ss(xmm0, xmm1, xmm2);
|
|
__ vfnmsub213ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
__ vfnmsub231ss(xmm0, xmm1, xmm2);
|
|
__ vfnmsub231ss(xmm0, xmm1, Operand(rbx, rcx, times_4, 10000));
|
|
}
|
|
}
|
|
// xchg.
|
|
{
|
|
__ xchgq(rax, rax);
|
|
__ xchgq(rax, rbx);
|
|
__ xchgq(rbx, rbx);
|
|
__ xchgq(rbx, Operand(rsp, 12));
|
|
}
|
|
|
|
// Nop instructions
|
|
for (int i = 0; i < 16; i++) {
|
|
__ Nop(i);
|
|
}
|
|
|
|
__ ret(0);
|
|
|
|
CodeDesc desc;
|
|
assm.GetCode(&desc);
|
|
Handle<Code> code = isolate->factory()->NewCode(
|
|
desc, Code::ComputeFlags(Code::STUB), Handle<Code>());
|
|
USE(code);
|
|
#ifdef OBJECT_PRINT
|
|
OFStream os(stdout);
|
|
code->Print(os);
|
|
byte* begin = code->instruction_start();
|
|
byte* end = begin + code->instruction_size();
|
|
disasm::Disassembler::Disassemble(stdout, begin, end);
|
|
#endif
|
|
}
|
|
|
|
#undef __
|