2011-10-03 11:44:39 +00:00
|
|
|
// Copyright 2011 the V8 project authors. All rights reserved.
|
2008-08-22 13:33:59 +00:00
|
|
|
// Redistribution and use in source and binary forms, with or without
|
|
|
|
// modification, are permitted provided that the following conditions are
|
|
|
|
// met:
|
|
|
|
//
|
|
|
|
// * Redistributions of source code must retain the above copyright
|
|
|
|
// notice, this list of conditions and the following disclaimer.
|
|
|
|
// * Redistributions in binary form must reproduce the above
|
|
|
|
// copyright notice, this list of conditions and the following
|
|
|
|
// disclaimer in the documentation and/or other materials provided
|
|
|
|
// with the distribution.
|
|
|
|
// * Neither the name of Google Inc. nor the names of its
|
|
|
|
// contributors may be used to endorse or promote products derived
|
|
|
|
// from this software without specific prior written permission.
|
|
|
|
//
|
|
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
|
|
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
|
|
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
|
|
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
|
|
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
2021-08-23 13:01:06 +00:00
|
|
|
#include "include/v8-function.h"
|
2014-06-30 13:25:46 +00:00
|
|
|
#include "src/base/platform/platform.h"
|
2015-04-21 10:21:50 +00:00
|
|
|
#include "src/base/utils/random-number-generator.h"
|
2019-05-21 09:30:15 +00:00
|
|
|
#include "src/codegen/assembler-inl.h"
|
|
|
|
#include "src/codegen/macro-assembler.h"
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in same cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
#include "src/deoptimizer/deoptimizer.h"
|
2019-05-20 09:15:06 +00:00
|
|
|
#include "src/diagnostics/disassembler.h"
|
2018-04-09 19:11:22 +00:00
|
|
|
#include "src/heap/factory.h"
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in same cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
#include "src/init/v8.h"
|
2019-05-23 13:27:57 +00:00
|
|
|
#include "src/utils/ostreams.h"
|
2014-06-03 08:12:43 +00:00
|
|
|
#include "test/cctest/cctest.h"
|
2021-12-15 09:47:21 +00:00
|
|
|
#include "test/common/assembler-tester.h"
|
2008-08-22 13:33:59 +00:00
|
|
|
|
2017-08-31 12:34:55 +00:00
|
|
|
namespace v8 {
|
|
|
|
namespace internal {
|
2008-08-22 13:33:59 +00:00
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Function type: no arguments, returns int.
using F0 = int();
|
|
|
|
// Function type: one int argument, returns int. Used below as the signature
// of generated code invoked through GeneratedCode<F1>.
using F1 = int(int x);
|
|
|
|
// Function type: two int arguments, returns int. Used below as the signature
// of generated code invoked through GeneratedCode<F2>.
using F2 = int(int x, int y);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
// Shorthand for emitting instructions: `__ foo(...)` expands to
// `assm.foo(...)`, so each test must name its local assembler `assm`.
#define __ assm.
|
|
|
|
|
|
|
|
// Assembles a two-argument function that adds its stack arguments and checks
// that calling it with (3, 4) yields 7.
TEST(AssemblerIa320) {
  CcTest::InitializeVM();
  auto* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);

  // Instructions are emitted into this fixed-size stack buffer.
  v8::internal::byte code_buffer[256];
  Assembler assm(AssemblerOptions{},
                 ExternalAssemblerBuffer(code_buffer, sizeof(code_buffer)));

  // eax = [esp + 4] + [esp + 8]; the result is returned in eax.
  __ mov(eax, Operand(esp, 4));
  __ add(eax, Operand(esp, 8));
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code_object =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code_object->Print(out);
#endif

  // Run the generated code and verify the sum.
  auto entry = GeneratedCode<F2>::FromCode(*code_object);
  const int result = entry.Call(3, 4);
  ::printf("f() = %d\n", result);
  CHECK_EQ(7, result);
}
|
|
|
|
|
|
|
|
|
|
|
|
// Assembles a loop that accumulates edx + (edx - 1) + ... + 1 into eax and
// checks that calling it with 100 yields 5050.
TEST(AssemblerIa321) {
  CcTest::InitializeVM();
  auto* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);

  // Instructions are emitted into this fixed-size stack buffer.
  v8::internal::byte code_buffer[256];
  Assembler assm(AssemblerOptions{},
                 ExternalAssemblerBuffer(code_buffer, sizeof(code_buffer)));
  Label loop_body;
  Label loop_check;

  // edx holds the counter taken from the stack argument; eax is the running
  // sum.
  __ mov(edx, Operand(esp, 4));
  __ xor_(eax, eax);  // clear eax
  __ jmp(&loop_check);

  // Loop body: add the counter to the sum, then decrement the counter.
  __ bind(&loop_body);
  __ add(eax, edx);
  __ sub(edx, Immediate(1));

  // Loop condition: keep iterating while the counter is non-zero.
  __ bind(&loop_check);
  __ test(edx, edx);
  __ j(not_zero, &loop_body);
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code_object =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code_object->Print(out);
#endif

  // Run the generated code and verify the sum 1 + 2 + ... + 100.
  auto entry = GeneratedCode<F1>::FromCode(*code_object);
  const int result = entry.Call(100);
  ::printf("f() = %d\n", result);
  CHECK_EQ(5050, result);
}
|
|
|
|
|
|
|
|
|
|
|
|
// Assembles a loop that multiplies eax by edx, edx - 1, ..., 1 (a factorial)
// and checks that calling it with 10 yields 3628800. Extra relocated
// instructions are emitted after the return and are never executed.
TEST(AssemblerIa322) {
  CcTest::InitializeVM();
  auto* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);

  // Instructions are emitted into this fixed-size stack buffer.
  v8::internal::byte code_buffer[256];
  Assembler assm(AssemblerOptions{},
                 ExternalAssemblerBuffer(code_buffer, sizeof(code_buffer)));
  Label loop_body;
  Label loop_check;

  // edx holds the counter taken from the stack argument; eax is the running
  // product, starting at 1.
  __ mov(edx, Operand(esp, 4));
  __ mov(eax, 1);
  __ jmp(&loop_check);

  // Loop body: multiply the product by the counter, then decrement it.
  __ bind(&loop_body);
  __ imul(eax, edx);
  __ sub(edx, Immediate(1));

  // Loop condition: keep iterating while the counter is non-zero.
  __ bind(&loop_check);
  __ test(edx, edx);
  __ j(not_zero, &loop_body);
  __ ret(0);

  // some relocated stuff here, not executed
  __ mov(eax, isolate->factory()->true_value());
  __ jmp(kNullAddress, RelocInfo::RUNTIME_ENTRY);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code_object =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code_object->Print(out);
#endif

  // Run the generated code and verify 10!.
  auto entry = GeneratedCode<F1>::FromCode(*code_object);
  const int result = entry.Call(10);
  ::printf("f() = %d\n", result);
  CHECK_EQ(3628800, result);
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Function type: one float argument, returns int. Used below as the signature
// of generated code invoked through GeneratedCode<F3>.
using F3 = int(float x);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
// Assembles a function that converts its float stack argument to an int with
// cvttss2si and checks that -3.1415f becomes -3.
TEST(AssemblerIa323) {
  CcTest::InitializeVM();

  auto* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);

  // Instructions are emitted into this fixed-size stack buffer.
  v8::internal::byte code_buffer[256];
  Assembler assm(AssemblerOptions{},
                 ExternalAssemblerBuffer(code_buffer, sizeof(code_buffer)));

  // eax = (int) float at [esp + 4]; the result is returned in eax.
  __ cvttss2si(eax, Operand(esp, 4));
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code_object =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code_object->Print(out);
#endif

  // Run the generated code and verify the converted value.
  auto entry = GeneratedCode<F3>::FromCode(*code_object);
  const int result = entry.Call(-3.1415f);
  ::printf("f() = %d\n", result);
  CHECK_EQ(-3, result);
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Signature of the generated code exercised by AssemblerIa324: takes a single
// double argument and returns an int.
using F4 = int(double x);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
TEST(AssemblerIa324) {
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
2011-03-31 16:17:37 +00:00
|
|
|
|
2013-04-10 08:29:39 +00:00
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
v8::internal::byte buffer[256];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof buffer));
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
__ cvttsd2si(eax, Operand(esp, 4));
|
|
|
|
__ ret(0);
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2014-09-25 08:33:24 +00:00
|
|
|
#ifdef OBJECT_PRINT
|
2018-06-14 12:46:07 +00:00
|
|
|
StdoutStream os;
|
2018-07-12 10:06:42 +00:00
|
|
|
code->Print(os);
|
2014-09-25 08:33:24 +00:00
|
|
|
#endif
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F4>::FromCode(*code);
|
|
|
|
int res = f.Call(2.718281828);
|
2008-08-22 13:33:59 +00:00
|
|
|
::printf("f() = %d\n", res);
|
|
|
|
CHECK_EQ(2, res);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// Read by the code generated in AssemblerIa325, which loads it into eax via
// its absolute address; that test expects the call to return 42.
static int baz = 42;
|
|
|
|
TEST(AssemblerIa325) {
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
v8::internal::byte buffer[256];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof buffer));
|
2008-08-22 13:33:59 +00:00
|
|
|
|
2021-11-17 18:14:02 +00:00
|
|
|
__ mov(eax, Operand(reinterpret_cast<intptr_t>(&baz), RelocInfo::NO_INFO));
|
2008-08-22 13:33:59 +00:00
|
|
|
__ ret(0);
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F0>::FromCode(*code);
|
|
|
|
int res = f.Call();
|
2008-08-22 13:33:59 +00:00
|
|
|
CHECK_EQ(42, res);
|
|
|
|
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Signature of the generated code exercised by AssemblerIa326: takes two
// double arguments and returns a double.
using F5 = double(double x, double y);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
TEST(AssemblerIa326) {
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
2011-03-31 16:17:37 +00:00
|
|
|
|
2013-04-10 08:29:39 +00:00
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2008-08-22 13:33:59 +00:00
|
|
|
v8::internal::byte buffer[256];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof buffer));
|
2008-08-22 13:33:59 +00:00
|
|
|
|
2019-02-14 16:22:26 +00:00
|
|
|
__ movsd(xmm0, Operand(esp, 1 * kSystemPointerSize));
|
|
|
|
__ movsd(xmm1, Operand(esp, 3 * kSystemPointerSize));
|
2008-08-22 13:33:59 +00:00
|
|
|
__ addsd(xmm0, xmm1);
|
|
|
|
__ mulsd(xmm0, xmm1);
|
|
|
|
__ subsd(xmm0, xmm1);
|
|
|
|
__ divsd(xmm0, xmm1);
|
2008-09-01 06:41:12 +00:00
|
|
|
// Copy xmm0 to st(0) using eight bytes of stack.
|
2011-10-03 11:44:39 +00:00
|
|
|
__ sub(esp, Immediate(8));
|
2013-10-18 10:54:45 +00:00
|
|
|
__ movsd(Operand(esp, 0), xmm0);
|
2008-09-01 06:41:12 +00:00
|
|
|
__ fld_d(Operand(esp, 0));
|
2011-10-03 11:44:39 +00:00
|
|
|
__ add(esp, Immediate(8));
|
2008-08-22 13:33:59 +00:00
|
|
|
__ ret(0);
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2014-09-25 08:33:24 +00:00
|
|
|
#ifdef OBJECT_PRINT
|
2018-06-14 12:46:07 +00:00
|
|
|
StdoutStream os;
|
2018-07-12 10:06:42 +00:00
|
|
|
code->Print(os);
|
2008-08-22 13:33:59 +00:00
|
|
|
#endif
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F5>::FromCode(*code);
|
|
|
|
double res = f.Call(2.2, 1.1);
|
2008-08-22 13:33:59 +00:00
|
|
|
::printf("f() = %f\n", res);
|
|
|
|
CHECK(2.29 < res && res < 2.31);
|
|
|
|
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Signature of the generated code exercised by AssemblerIa328: takes a single
// int argument and returns a double.
using F6 = double(int x);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
TEST(AssemblerIa328) {
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
2011-03-31 16:17:37 +00:00
|
|
|
|
2013-04-10 08:29:39 +00:00
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2008-08-22 13:33:59 +00:00
|
|
|
v8::internal::byte buffer[256];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof buffer));
|
2008-08-22 13:33:59 +00:00
|
|
|
__ mov(eax, Operand(esp, 4));
|
2011-10-03 11:44:39 +00:00
|
|
|
__ cvtsi2sd(xmm0, eax);
|
2008-09-01 06:41:12 +00:00
|
|
|
// Copy xmm0 to st(0) using eight bytes of stack.
|
2011-10-03 11:44:39 +00:00
|
|
|
__ sub(esp, Immediate(8));
|
2013-10-18 10:54:45 +00:00
|
|
|
__ movsd(Operand(esp, 0), xmm0);
|
2008-09-01 06:41:12 +00:00
|
|
|
__ fld_d(Operand(esp, 0));
|
2011-10-03 11:44:39 +00:00
|
|
|
__ add(esp, Immediate(8));
|
2008-08-22 13:33:59 +00:00
|
|
|
__ ret(0);
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2011-01-03 09:32:42 +00:00
|
|
|
#ifdef OBJECT_PRINT
|
2018-06-14 12:46:07 +00:00
|
|
|
StdoutStream os;
|
2018-07-12 10:06:42 +00:00
|
|
|
code->Print(os);
|
2008-08-22 13:33:59 +00:00
|
|
|
#endif
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F6>::FromCode(*code);
|
|
|
|
double res = f.Call(12);
|
2008-08-22 13:33:59 +00:00
|
|
|
|
|
|
|
::printf("f() = %f\n", res);
|
|
|
|
CHECK(11.99 < res && res < 12.001);
|
|
|
|
}
|
|
|
|
|
2011-08-30 07:36:31 +00:00
|
|
|
// Assembles two conditional jumps to the same label before that label is
// bound. The emitted code is never finalized with GetCode() or executed here;
// the test only exercises the assembler calls themselves.
TEST(AssemblerIa3210) {
|
|
|
|
// Test chaining of label usages within instructions (issue 1644).
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2019-01-16 18:29:52 +00:00
|
|
|
// Unlike the other tests in this file, no external buffer is passed here.
Assembler assm(AssemblerOptions{});
|
2011-08-30 07:36:31 +00:00
|
|
|
|
|
|
|
|
Label target;
|
|
|
|
// First use of the still-unbound label.
__ j(equal, &target);
|
|
|
|
// Second use of the same unbound label; both uses must be resolved by the
// bind() below.
__ j(not_equal, &target);
|
|
|
|
__ bind(&target);
|
|
|
|
__ nop();
|
|
|
|
}
|
|
|
|
|
2011-12-02 10:01:50 +00:00
|
|
|
|
|
|
|
TEST(AssemblerMultiByteNop) {
|
2013-04-10 08:29:39 +00:00
|
|
|
CcTest::InitializeVM();
|
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
2013-03-15 12:06:53 +00:00
|
|
|
HandleScope scope(isolate);
|
2011-12-02 10:01:50 +00:00
|
|
|
v8::internal::byte buffer[1024];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof(buffer)));
|
2011-12-02 10:01:50 +00:00
|
|
|
__ push(ebx);
|
|
|
|
__ push(ecx);
|
|
|
|
__ push(edx);
|
|
|
|
__ push(edi);
|
|
|
|
__ push(esi);
|
|
|
|
__ mov(eax, 1);
|
|
|
|
__ mov(ebx, 2);
|
|
|
|
__ mov(ecx, 3);
|
|
|
|
__ mov(edx, 4);
|
|
|
|
__ mov(edi, 5);
|
|
|
|
__ mov(esi, 6);
|
|
|
|
for (int i = 0; i < 16; i++) {
|
|
|
|
int before = assm.pc_offset();
|
|
|
|
__ Nop(i);
|
|
|
|
CHECK_EQ(assm.pc_offset() - before, i);
|
|
|
|
}
|
|
|
|
|
|
|
|
Label fail;
|
|
|
|
__ cmp(eax, 1);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ cmp(ebx, 2);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ cmp(ecx, 3);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ cmp(edx, 4);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ cmp(edi, 5);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ cmp(esi, 6);
|
|
|
|
__ j(not_equal, &fail);
|
|
|
|
__ mov(eax, 42);
|
|
|
|
__ pop(esi);
|
|
|
|
__ pop(edi);
|
|
|
|
__ pop(edx);
|
|
|
|
__ pop(ecx);
|
|
|
|
__ pop(ebx);
|
|
|
|
__ ret(0);
|
|
|
|
__ bind(&fail);
|
|
|
|
__ mov(eax, 13);
|
|
|
|
__ pop(esi);
|
|
|
|
__ pop(edi);
|
|
|
|
__ pop(edx);
|
|
|
|
__ pop(ecx);
|
|
|
|
__ pop(ebx);
|
|
|
|
__ ret(0);
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2011-12-02 10:01:50 +00:00
|
|
|
CHECK(code->IsCode());
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F0>::FromCode(*code);
|
|
|
|
int res = f.Call();
|
2011-12-02 10:01:50 +00:00
|
|
|
CHECK_EQ(42, res);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2013-07-29 12:12:39 +00:00
|
|
|
#ifdef __GNUC__
|
2015-01-30 09:29:25 +00:00
|
|
|
// Number of elements DoSSE2 requires in its input array. Each element is
// pushed onto the stack as a 32-bit immediate before the vector is loaded
// into xmm0. NOTE(review): presumably unsigned (4u) so that it compares
// cleanly against vec->Length() in CHECK_EQ; confirm.
#define ELEMENT_COUNT 4u
|
2013-07-05 08:34:17 +00:00
|
|
|
|
|
|
|
void DoSSE2(const v8::FunctionCallbackInfo<v8::Value>& args) {
|
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
|
|
|
HandleScope scope(isolate);
|
2015-11-20 09:29:26 +00:00
|
|
|
v8::Local<v8::Context> context = CcTest::isolate()->GetCurrentContext();
|
2013-07-05 08:34:17 +00:00
|
|
|
|
|
|
|
CHECK(args[0]->IsArray());
|
|
|
|
v8::Local<v8::Array> vec = v8::Local<v8::Array>::Cast(args[0]);
|
|
|
|
CHECK_EQ(ELEMENT_COUNT, vec->Length());
|
|
|
|
|
|
|
|
v8::internal::byte buffer[256];
|
2019-01-16 18:29:52 +00:00
|
|
|
Assembler assm(AssemblerOptions{},
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof buffer));
|
2013-07-05 08:34:17 +00:00
|
|
|
|
|
|
|
// Remove the return address from the stack to fix stack frame alignment.
|
|
|
|
__ pop(ecx);
|
|
|
|
|
|
|
|
// Store input vector on the stack.
|
2015-01-30 09:29:25 +00:00
|
|
|
for (unsigned i = 0; i < ELEMENT_COUNT; ++i) {
|
2015-11-20 09:29:26 +00:00
|
|
|
__ push(Immediate(
|
|
|
|
vec->Get(context, i).ToLocalChecked()->Int32Value(context).FromJust()));
|
2013-07-05 08:34:17 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Read vector into a xmm register.
|
|
|
|
__ pxor(xmm0, xmm0);
|
|
|
|
__ movdqa(xmm0, Operand(esp, 0));
|
|
|
|
// Create mask and store it in the return register.
|
|
|
|
__ movmskps(eax, xmm0);
|
|
|
|
|
|
|
|
// Remove unused data from the stack.
|
|
|
|
__ add(esp, Immediate(ELEMENT_COUNT * sizeof(int32_t)));
|
|
|
|
// Restore return address.
|
|
|
|
__ push(ecx);
|
|
|
|
|
|
|
|
__ ret(0);
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
2013-07-05 08:34:17 +00:00
|
|
|
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in same cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2013-07-05 08:34:17 +00:00
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F0>::FromCode(*code);
|
|
|
|
int res = f.Call();
|
2014-01-03 14:31:17 +00:00
|
|
|
args.GetReturnValue().Set(v8::Integer::New(CcTest::isolate(), res));
|
2013-07-05 08:34:17 +00:00
|
|
|
}
|
|
|
|
|
2013-07-05 09:52:11 +00:00
|
|
|
|
2013-07-05 08:34:17 +00:00
|
|
|
// Calls DoSSE2 from JavaScript (through the global function do_sse2) and
// checks that the sign mask it computes for {-1, 1, 1, 1} is 8.
TEST(StackAlignmentForSSE2) {
  CcTest::InitializeVM();
  // The test is only meaningful when activation frames are 16-byte aligned.
  CHECK_EQ(0, v8::base::OS::ActivationFrameAlignment() % 16);

  v8::Isolate* isolate = CcTest::isolate();
  v8::HandleScope handle_scope(isolate);

  // Install DoSSE2 as the global function do_sse2 of a fresh context.
  v8::Local<v8::ObjectTemplate> globals = v8::ObjectTemplate::New(isolate);
  v8::Local<v8::FunctionTemplate> do_sse2_template =
      v8::FunctionTemplate::New(isolate, DoSSE2);
  globals->Set(v8_str("do_sse2"), do_sse2_template);

  LocalContext env(nullptr, globals);
  CompileRun(
      "function foo(vec) {"
      " return do_sse2(vec);"
      "}");

  // Look up the JavaScript wrapper that was just compiled.
  v8::Local<v8::Object> global_object = env->Global();
  v8::Local<v8::Value> foo_value =
      global_object->Get(env.local(), v8_str("foo")).ToLocalChecked();
  v8::Local<v8::Function> foo_fn = v8::Local<v8::Function>::Cast(foo_value);

  // Build the input array; only element 0 is negative.
  int32_t lanes[ELEMENT_COUNT] = {-1, 1, 1, 1};
  v8::Local<v8::Array> js_lanes = v8::Array::New(isolate, ELEMENT_COUNT);
  for (unsigned idx = 0; idx != ELEMENT_COUNT; ++idx) {
    js_lanes->Set(env.local(), idx, v8_num(lanes[idx])).FromJust();
  }

  v8::Local<v8::Value> argv[] = {js_lanes};
  v8::Local<v8::Value> mask =
      foo_fn->Call(env.local(), global_object, 1, argv).ToLocalChecked();

  // DoSSE2 pushes element 0 first, so it ends up in the highest lane and
  // its sign bit is bit 3 of the mask: 0b1000.
  CHECK_EQ(8, mask->Int32Value(env.local()).FromJust());
}
|
|
|
|
|
|
|
|
#undef ELEMENT_COUNT
|
2013-07-29 12:12:39 +00:00
|
|
|
#endif // __GNUC__
|
2011-12-02 10:01:50 +00:00
|
|
|
|
|
|
|
|
2013-10-15 12:51:58 +00:00
|
|
|
// Checks extractps: the generated code loads its double argument into xmm1
// and returns 32-bit lane 1 (the upper half of the double's bit pattern).
// Returns early when SSE4.1 is not available.
TEST(AssemblerIa32Extractps) {
  CcTest::InitializeVM();
  if (!CpuFeatures::IsSupported(SSE4_1)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[256];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    CpuFeatureScope sse41_scope(&assm, SSE4_1);
    // The double argument sits right above the return address.
    __ movsd(xmm1, Operand(esp, 4));
    // Lane 1 holds bits 32..63 of the double.
    __ extractps(eax, xmm1, 0x1);
    __ ret(0);
  }

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto generated = GeneratedCode<F4>::FromCode(*code);

  // Upper word with the sign bit clear.
  uint64_t positive_bits = 0x1234'5678'8765'4321;
  CHECK_EQ(0x12345678, generated.Call(base::uint64_to_double(positive_bits)));

  // Upper word with the sign bit set; compared as a signed int.
  uint64_t negative_bits = 0x8765'4321'1234'5678;
  CHECK_EQ(static_cast<int>(0x87654321),
           generated.Call(base::uint64_to_double(negative_bits)));
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Function type of generated test code that takes two floats and returns an
// int; instantiated through GeneratedCode<F8> by the SSE tests below.
using F8 = int(float x, float y);
|
2013-11-18 15:24:41 +00:00
|
|
|
// Exercises the packed single-precision SSE arithmetic instructions.
// For arguments x and y the generated code evaluates ((y + x) * y - x) / y
// in every lane and returns lane 0 truncated to an integer.
TEST(AssemblerIa32SSE) {
  CcTest::InitializeVM();

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[256];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    // Fetch x and y from the stack slots above the return address.
    __ movss(xmm0, Operand(esp, kSystemPointerSize));
    __ movss(xmm1, Operand(esp, 2 * kSystemPointerSize));
    // Replicate lane 0 of each register into all four lanes.
    __ shufps(xmm0, xmm0, 0x0);
    __ shufps(xmm1, xmm1, 0x0);
    __ movaps(xmm2, xmm1);  // xmm2 = y
    __ addps(xmm2, xmm0);   // xmm2 = y + x
    __ mulps(xmm2, xmm1);   // xmm2 = (y + x) * y
    __ subps(xmm2, xmm0);   // xmm2 = (y + x) * y - x
    __ divps(xmm2, xmm1);   // xmm2 = ((y + x) * y - x) / y
    // Truncating conversion of lane 0 into the return register.
    __ cvttss2si(eax, xmm2);
    __ ret(0);
  }

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto generated = GeneratedCode<F8>::FromCode(*code);
  // x = 1, y = 2: ((2 + 1) * 2 - 1) / 2 = 2.5, which truncates to 2.
  CHECK_EQ(2, generated.Call(1.0, 2.0));
}
|
|
|
|
|
2018-02-28 06:28:08 +00:00
|
|
|
// Exercises the SSE3 horizontal add (haddps). Both float arguments are
// replicated across their registers, haddps sums adjacent lanes, and lane 0
// of the result is returned truncated to an integer.
// Returns early when SSE3 is not available.
TEST(AssemblerIa32SSE3) {
  CcTest::InitializeVM();
  if (!CpuFeatures::IsSupported(SSE3)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[256];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    CpuFeatureScope sse3_scope(&assm, SSE3);
    // Fetch x and y from the stack slots above the return address.
    __ movss(xmm0, Operand(esp, kSystemPointerSize));
    __ movss(xmm1, Operand(esp, 2 * kSystemPointerSize));
    // Replicate lane 0 of each register into all four lanes.
    __ shufps(xmm0, xmm0, 0x0);
    __ shufps(xmm1, xmm1, 0x0);
    // Lane 0 of the result is xmm1[0] + xmm1[1], i.e. y + y.
    __ haddps(xmm1, xmm0);
    // Truncating conversion of lane 0 into the return register.
    __ cvttss2si(eax, xmm1);
    __ ret(0);
  }

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto generated = GeneratedCode<F8>::FromCode(*code);
  // x = 1, y = 2: lane 0 becomes 2 + 2 = 4.
  CHECK_EQ(4, generated.Call(1.0, 2.0));
}
|
2013-11-18 15:24:41 +00:00
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Function type of generated test code that takes three doubles and returns
// an int.
using F9 = int(double x, double y, double z);
|
2014-12-02 15:30:03 +00:00
|
|
|
TEST(AssemblerX64FMA_sd) {
|
|
|
|
CcTest::InitializeVM();
|
|
|
|
if (!CpuFeatures::IsSupported(FMA3)) return;
|
|
|
|
|
|
|
|
Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
|
|
|
|
HandleScope scope(isolate);
|
|
|
|
v8::internal::byte buffer[1024];
|
2019-01-16 18:29:52 +00:00
|
|
|
MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof(buffer)));
|
2014-12-02 15:30:03 +00:00
|
|
|
{
|
|
|
|
CpuFeatureScope fscope(&assm, FMA3);
|
|
|
|
Label exit;
|
2019-02-14 16:22:26 +00:00
|
|
|
__ movsd(xmm0, Operand(esp, 1 * kSystemPointerSize));
|
|
|
|
__ movsd(xmm1, Operand(esp, 3 * kSystemPointerSize));
|
|
|
|
__ movsd(xmm2, Operand(esp, 5 * kSystemPointerSize));
|
2014-12-02 15:30:03 +00:00
|
|
|
// argument in xmm0, xmm1 and xmm2
|
|
|
|
// xmm0 * xmm1 + xmm2
|
|
|
|
__ movaps(xmm3, xmm0);
|
|
|
|
__ mulsd(xmm3, xmm1);
|
|
|
|
__ addsd(xmm3, xmm2); // Expected result in xmm3
|
|
|
|
|
2019-05-02 17:02:14 +00:00
|
|
|
__ AllocateStackSpace(kDoubleSize); // For memory operand
|
2014-12-02 15:30:03 +00:00
|
|
|
// vfmadd132sd
|
|
|
|
__ mov(eax, Immediate(1)); // Test number
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ vfmadd132sd(xmm4, xmm2, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmadd213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ vfmadd213sd(xmm4, xmm0, xmm2);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmadd231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ vfmadd231sd(xmm4, xmm0, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
// vfmadd132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfmadd132sd(xmm4, xmm2, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmadd213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ movsd(Operand(esp, 0), xmm2);
|
|
|
|
__ vfmadd213sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmadd231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfmadd231sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
// xmm0 * xmm1 - xmm2
|
|
|
|
__ movaps(xmm3, xmm0);
|
|
|
|
__ mulsd(xmm3, xmm1);
|
|
|
|
__ subsd(xmm3, xmm2); // Expected result in xmm3
|
|
|
|
|
|
|
|
// vfmsub132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ vfmsub132sd(xmm4, xmm2, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmsub213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ vfmsub213sd(xmm4, xmm0, xmm2);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmsub231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ vfmsub231sd(xmm4, xmm0, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
// vfmsub132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfmsub132sd(xmm4, xmm2, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmsub213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ movsd(Operand(esp, 0), xmm2);
|
|
|
|
__ vfmsub213sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfmsub231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfmsub231sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
|
|
|
|
// - xmm0 * xmm1 + xmm2
|
|
|
|
__ movaps(xmm3, xmm0);
|
|
|
|
__ mulsd(xmm3, xmm1);
|
|
|
|
__ Move(xmm4, (uint64_t)1 << 63);
|
|
|
|
__ xorpd(xmm3, xmm4);
|
|
|
|
__ addsd(xmm3, xmm2); // Expected result in xmm3
|
|
|
|
|
|
|
|
// vfnmadd132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ vfnmadd132sd(xmm4, xmm2, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmadd213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ vfnmadd213sd(xmm4, xmm0, xmm2);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmadd231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ vfnmadd231sd(xmm4, xmm0, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
// vfnmadd132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfnmadd132sd(xmm4, xmm2, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmadd213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ movsd(Operand(esp, 0), xmm2);
|
|
|
|
__ vfnmadd213sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmadd231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfnmadd231sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
|
|
|
|
// - xmm0 * xmm1 - xmm2
|
|
|
|
__ movaps(xmm3, xmm0);
|
|
|
|
__ mulsd(xmm3, xmm1);
|
|
|
|
__ Move(xmm4, (uint64_t)1 << 63);
|
|
|
|
__ xorpd(xmm3, xmm4);
|
|
|
|
__ subsd(xmm3, xmm2); // Expected result in xmm3
|
|
|
|
|
|
|
|
// vfnmsub132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ vfnmsub132sd(xmm4, xmm2, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmsub213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ vfnmsub213sd(xmm4, xmm0, xmm2);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmsub231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ vfnmsub231sd(xmm4, xmm0, xmm1);
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
// vfnmsub132sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm0);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfnmsub132sd(xmm4, xmm2, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmsub213sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm1);
|
|
|
|
__ movsd(Operand(esp, 0), xmm2);
|
|
|
|
__ vfnmsub213sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
// vfnmsub231sd
|
|
|
|
__ inc(eax);
|
|
|
|
__ movaps(xmm4, xmm2);
|
|
|
|
__ movsd(Operand(esp, 0), xmm1);
|
|
|
|
__ vfnmsub231sd(xmm4, xmm0, Operand(esp, 0));
|
|
|
|
__ ucomisd(xmm4, xmm3);
|
|
|
|
__ j(not_equal, &exit);
|
|
|
|
|
|
|
|
|
|
|
|
__ xor_(eax, eax);
|
|
|
|
__ bind(&exit);
|
|
|
|
__ add(esp, Immediate(kDoubleSize));
|
|
|
|
__ ret(0);
|
|
|
|
}
|
|
|
|
|
|
|
|
CodeDesc desc;
|
2017-05-31 14:00:11 +00:00
|
|
|
assm.GetCode(isolate, &desc);
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
Handle<Code> code =
|
|
|
|
Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
|
2014-12-02 15:30:03 +00:00
|
|
|
#ifdef OBJECT_PRINT
|
2018-06-14 12:46:07 +00:00
|
|
|
StdoutStream os;
|
2018-07-12 10:06:42 +00:00
|
|
|
code->Print(os);
|
2014-12-02 15:30:03 +00:00
|
|
|
#endif
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
auto f = GeneratedCode<F9>::FromCode(*code);
|
|
|
|
CHECK_EQ(
|
|
|
|
0, f.Call(0.000092662107262076, -2.460774966188315, -1.0958787393627414));
|
2014-12-02 15:30:03 +00:00
|
|
|
}
|
|
|
|
|
2021-12-15 09:47:21 +00:00
|
|
|
// Signature of the generated code exercised by the single-precision FMA test:
// three float arguments in, an int out. The generated code returns 0 when
// every check passes, otherwise the number of the first failing check.
using F10 = int(float x, float y, float z);
|
2014-12-02 15:30:03 +00:00
|
|
|
// Checks the scalar single-precision FMA3 instructions (vfmadd, vfmsub,
// vfnmadd, vfnmsub; each in its 132, 213 and 231 form, with both a register
// and a memory source operand).
//
// The generated function takes three floats (loaded into xmm0, xmm1, xmm2).
// For each instruction family the expected value is first computed into xmm3
// with separate multiply / add / subtract instructions, then every form is
// executed into xmm4 and compared against xmm3. eax holds the number of the
// check currently running; on the first mismatch the code jumps to |exit|
// with that number still in eax. If all checks pass eax is cleared, so the
// caller expects 0.
//
// NOTE(review): the test name says X64 although the code uses ia32 registers
// (esp, eax); the name is kept because it is the test's public identifier.
TEST(AssemblerX64FMA_ss) {
  CcTest::InitializeVM();
  // Nothing to test on CPUs without FMA3.
  if (!CpuFeatures::IsSupported(FMA3)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[1024];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    CpuFeatureScope fscope(&assm, FMA3);
    Label exit;
    __ movss(xmm0, Operand(esp, 1 * kSystemPointerSize));
    __ movss(xmm1, Operand(esp, 2 * kSystemPointerSize));
    __ movss(xmm2, Operand(esp, 3 * kSystemPointerSize));
    // arguments in xmm0, xmm1 and xmm2

    // ---- xmm0 * xmm1 + xmm2 ----
    __ movaps(xmm3, xmm0);
    __ mulss(xmm3, xmm1);
    __ addss(xmm3, xmm2);  // Expected result in xmm3

    // Scratch slot used by all memory-operand checks below; released at
    // |exit|, which is only reachable after this allocation.
    __ AllocateStackSpace(kDoubleSize);  // For memory operand

    // Register-operand forms.
    // vfmadd132ss
    __ mov(eax, Immediate(1));  // Test number
    __ movaps(xmm4, xmm0);
    __ vfmadd132ss(xmm4, xmm2, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmadd213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ vfmadd213ss(xmm4, xmm0, xmm2);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmadd231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ vfmadd231ss(xmm4, xmm0, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);

    // Memory-operand forms: the last operand is stored to the scratch slot.
    // vfmadd132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ movss(Operand(esp, 0), xmm1);
    __ vfmadd132ss(xmm4, xmm2, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmadd213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ movss(Operand(esp, 0), xmm2);
    __ vfmadd213ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmadd231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ movss(Operand(esp, 0), xmm1);
    __ vfmadd231ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);

    // ---- xmm0 * xmm1 - xmm2 ----
    __ movaps(xmm3, xmm0);
    __ mulss(xmm3, xmm1);
    __ subss(xmm3, xmm2);  // Expected result in xmm3

    // Register-operand forms.
    // vfmsub132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ vfmsub132ss(xmm4, xmm2, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmsub213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ vfmsub213ss(xmm4, xmm0, xmm2);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmsub231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ vfmsub231ss(xmm4, xmm0, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);

    // Memory-operand forms.
    // vfmsub132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ movss(Operand(esp, 0), xmm1);
    __ vfmsub132ss(xmm4, xmm2, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmsub213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ movss(Operand(esp, 0), xmm2);
    __ vfmsub213ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfmsub231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ movss(Operand(esp, 0), xmm1);
    __ vfmsub231ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);


    // ---- - xmm0 * xmm1 + xmm2 ----
    __ movaps(xmm3, xmm0);
    __ mulss(xmm3, xmm1);
    // XOR with bit 31 set negates the product held in the low float lane.
    __ Move(xmm4, (uint32_t)1 << 31);
    __ xorps(xmm3, xmm4);
    __ addss(xmm3, xmm2);  // Expected result in xmm3

    // Register-operand forms.
    // vfnmadd132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ vfnmadd132ss(xmm4, xmm2, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmadd213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ vfnmadd213ss(xmm4, xmm0, xmm2);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmadd231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ vfnmadd231ss(xmm4, xmm0, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);

    // Memory-operand forms.
    // vfnmadd132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ movss(Operand(esp, 0), xmm1);
    __ vfnmadd132ss(xmm4, xmm2, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmadd213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ movss(Operand(esp, 0), xmm2);
    __ vfnmadd213ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmadd231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ movss(Operand(esp, 0), xmm1);
    __ vfnmadd231ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);


    // ---- - xmm0 * xmm1 - xmm2 ----
    __ movaps(xmm3, xmm0);
    __ mulss(xmm3, xmm1);
    // Same sign-bit flip as above to negate the product.
    __ Move(xmm4, (uint32_t)1 << 31);
    __ xorps(xmm3, xmm4);
    __ subss(xmm3, xmm2);  // Expected result in xmm3

    // Register-operand forms.
    // vfnmsub132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ vfnmsub132ss(xmm4, xmm2, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmsub213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ vfnmsub213ss(xmm4, xmm0, xmm2);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmsub231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ vfnmsub231ss(xmm4, xmm0, xmm1);
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);

    // Memory-operand forms.
    // vfnmsub132ss
    __ inc(eax);
    __ movaps(xmm4, xmm0);
    __ movss(Operand(esp, 0), xmm1);
    __ vfnmsub132ss(xmm4, xmm2, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmsub213ss
    __ inc(eax);
    __ movaps(xmm4, xmm1);
    __ movss(Operand(esp, 0), xmm2);
    __ vfnmsub213ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);
    // vfnmsub231ss
    __ inc(eax);
    __ movaps(xmm4, xmm2);
    __ movss(Operand(esp, 0), xmm1);
    __ vfnmsub231ss(xmm4, xmm0, Operand(esp, 0));
    __ ucomiss(xmm4, xmm3);
    __ j(not_equal, &exit);


    // All checks passed: report 0. Failing checks jump straight to |exit|
    // and keep their test number in eax.
    __ xor_(eax, eax);
    __ bind(&exit);
    __ add(esp, Immediate(kDoubleSize));  // Release the scratch slot.
    __ ret(0);
  }

  CodeDesc desc;
  assm.GetCode(isolate, &desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream os;
  code->Print(os);
#endif

  auto f = GeneratedCode<F10>::FromCode(*code);
  CHECK_EQ(0, f.Call(9.26621069e-05f, -2.4607749f, -1.09587872f));
}
|
2015-02-06 08:51:39 +00:00
|
|
|
|
|
|
|
|
2015-04-09 06:50:52 +00:00
|
|
|
// Checks the BMI1 instructions andn, bextr, blsi, blsmsk, blsr and tzcnt,
// each once with a register source and once with a memory source.
//
// The generated function takes no arguments. The source value 0x55667788 is
// kept in ecx and also pushed on the stack so Operand(esp, 0) reads the same
// value. eax holds the number of the check currently running; on the first
// mismatch the code jumps to |exit| with that number still in eax. If all
// checks pass eax is cleared, so the caller expects 0.
TEST(AssemblerIa32BMI1) {
  CcTest::InitializeVM();
  // Nothing to test on CPUs without BMI1.
  if (!CpuFeatures::IsSupported(BMI1)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[1024];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    CpuFeatureScope fscope(&assm, BMI1);
    Label exit;

    __ push(ebx);                         // save ebx
    __ mov(ecx, Immediate(0x55667788u));  // source operand
    __ push(ecx);                         // For memory operand

    // andn
    // edx has only bit 29 set, which is clear in the source value, so the
    // expected result equals the source value itself.
    __ mov(edx, Immediate(0x20000000u));

    __ mov(eax, Immediate(1));  // Test number
    __ andn(ebx, edx, ecx);
    __ cmp(ebx, Immediate(0x55667788u));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ andn(ebx, edx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x55667788u));  // expected result
    __ j(not_equal, &exit);

    // bextr
    // Control word in edx: start bit 0x08 in the low byte, length 0x28 in
    // the next byte; the expected result is the source shifted right by 8.
    __ mov(edx, Immediate(0x00002808u));

    __ inc(eax);
    __ bextr(ebx, ecx, edx);
    __ cmp(ebx, Immediate(0x00556677u));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ bextr(ebx, Operand(esp, 0), edx);
    __ cmp(ebx, Immediate(0x00556677u));  // expected result
    __ j(not_equal, &exit);

    // blsi
    // Expected: only the lowest set bit of the source (bit 3).
    __ inc(eax);
    __ blsi(ebx, ecx);
    __ cmp(ebx, Immediate(0x00000008u));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ blsi(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x00000008u));  // expected result
    __ j(not_equal, &exit);

    // blsmsk
    // Expected: all bits up to and including the lowest set bit of the source.
    __ inc(eax);
    __ blsmsk(ebx, ecx);
    __ cmp(ebx, Immediate(0x0000000Fu));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ blsmsk(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x0000000Fu));  // expected result
    __ j(not_equal, &exit);

    // blsr
    // Expected: the source with its lowest set bit cleared.
    __ inc(eax);
    __ blsr(ebx, ecx);
    __ cmp(ebx, Immediate(0x55667780u));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ blsr(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x55667780u));  // expected result
    __ j(not_equal, &exit);

    // tzcnt
    // Expected: the source has three trailing zero bits.
    __ inc(eax);
    __ tzcnt(ebx, ecx);
    __ cmp(ebx, Immediate(3));  // expected result
    __ j(not_equal, &exit);

    __ inc(eax);
    __ tzcnt(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(3));  // expected result
    __ j(not_equal, &exit);

    // All checks passed: report 0. Failing checks jump straight to |exit|
    // and keep their test number in eax.
    __ xor_(eax, eax);
    __ bind(&exit);
    __ pop(ecx);  // Drop the memory-operand slot.
    __ pop(ebx);  // Restore the saved ebx.
    __ ret(0);
  }

  CodeDesc desc;
  assm.GetCode(isolate, &desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream os;
  code->Print(os);
#endif

  auto f = GeneratedCode<F0>::FromCode(*code);
  CHECK_EQ(0, f.Call());
}
|
|
|
|
|
|
|
|
|
|
|
|
// Checks the lzcnt instruction with a register source and with a memory
// source.
//
// The generated function takes no arguments. The source value 0x55667788 is
// kept in ecx and also pushed on the stack so Operand(esp, 0) reads the same
// value; both checks expect a count of 1. eax holds the number of the check
// currently running; on a mismatch the code jumps to |exit| with that number
// still in eax. If both checks pass eax is cleared, so the caller expects 0.
TEST(AssemblerIa32LZCNT) {
  CcTest::InitializeVM();
  // Nothing to test on CPUs without LZCNT.
  if (!CpuFeatures::IsSupported(LZCNT)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope scope(isolate);
  v8::internal::byte buffer[256];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(buffer, sizeof(buffer)));
  {
    CpuFeatureScope fscope(&assm, LZCNT);
    Label exit;

    __ push(ebx);                         // save ebx
    __ mov(ecx, Immediate(0x55667788u));  // source operand
    __ push(ecx);                         // For memory operand

    // Register source.
    __ mov(eax, Immediate(1));  // Test number
    __ lzcnt(ebx, ecx);
    __ cmp(ebx, Immediate(1));  // expected result
    __ j(not_equal, &exit);

    // Memory source.
    __ inc(eax);
    __ lzcnt(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(1));  // expected result
    __ j(not_equal, &exit);

    // Both checks passed: report 0. A failing check jumps straight to |exit|
    // and keeps its test number in eax.
    __ xor_(eax, eax);
    __ bind(&exit);
    __ pop(ecx);  // Drop the memory-operand slot.
    __ pop(ebx);  // Restore the saved ebx.
    __ ret(0);
  }

  CodeDesc desc;
  assm.GetCode(isolate, &desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream os;
  code->Print(os);
#endif

  auto f = GeneratedCode<F0>::FromCode(*code);
  CHECK_EQ(0, f.Call());
}
|
|
|
|
|
|
|
|
|
|
|
|
// Exercises the POPCNT instruction with a register source and with a memory
// source. While the generated code runs, eax holds the number of the check
// currently being executed; it is cleared only after every check has passed,
// and the test expects the generated function to yield 0.
TEST(AssemblerIa32POPCNT) {
  CcTest::InitializeVM();
  // Skip silently when the POPCNT feature is not reported as supported.
  if (!CpuFeatures::IsSupported(POPCNT)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope handle_scope(isolate);
  v8::internal::byte scratch[256];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(scratch, sizeof(scratch)));
  {
    CpuFeatureScope feature_scope(&assm, POPCNT);
    Label bail_out;

    // Prologue: preserve ebx and place the source value both in ecx and on
    // top of the stack so that Operand(esp, 0) refers to it.
    __ push(ebx);                         // save ebx
    __ mov(ecx, Immediate(0x11111100u));  // source operand
    __ push(ecx);                         // For memory operand

    // Check 1: register source.
    __ mov(eax, Immediate(1));  // Test number
    __ popcnt(ebx, ecx);
    __ cmp(ebx, Immediate(6));  // expected result
    __ j(not_equal, &bail_out);

    // Check 2: memory source.
    __ inc(eax);
    __ popcnt(ebx, Operand(esp, 0));
    __ cmp(ebx, Immediate(6));  // expected result
    __ j(not_equal, &bail_out);

    // All checks passed: report 0.
    __ xor_(eax, eax);
    __ bind(&bail_out);
    // Epilogue: drop the memory operand and restore ebx.
    __ pop(ecx);
    __ pop(ebx);
    __ ret(0);
  }

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto entry = GeneratedCode<F0>::FromCode(*code);
  CHECK_EQ(0, entry.Call());
}
|
|
|
|
|
|
|
|
|
|
|
|
// Exercises the BMI2 instructions (bzhi, mulx, pdep, pext, sarx, shlx, shrx,
// rorx), each once with a register operand and once with a memory operand.
// While the generated code runs, eax holds the number of the check currently
// being executed; it is cleared only after every check has passed, and the
// test expects the generated function to yield 0.
TEST(AssemblerIa32BMI2) {
  CcTest::InitializeVM();
  // Skip silently when the BMI2 feature is not reported as supported.
  if (!CpuFeatures::IsSupported(BMI2)) return;

  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope handle_scope(isolate);
  v8::internal::byte scratch[2048];
  MacroAssembler assm(isolate, v8::internal::CodeObjectRequired::kYes,
                      ExternalAssemblerBuffer(scratch, sizeof(scratch)));
  {
    CpuFeatureScope feature_scope(&assm, BMI2);
    Label bail_out;

    // Prologue: preserve ebx/esi and place the source value both in ecx and
    // on top of the stack so that Operand(esp, 0) refers to it.
    __ push(ebx);                         // save ebx
    __ push(esi);                         // save esi
    __ mov(ecx, Immediate(0x55667788u));  // source operand
    __ push(ecx);                         // For memory operand

    // bzhi
    __ mov(edx, Immediate(9));

    __ mov(eax, Immediate(1));  // Test number
    __ bzhi(ebx, ecx, edx);
    __ cmp(ebx, Immediate(0x00000188u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ bzhi(ebx, Operand(esp, 0), edx);
    __ cmp(ebx, Immediate(0x00000188u));  // expected result
    __ j(not_equal, &bail_out);

    // mulx
    __ mov(edx, Immediate(0x00001000u));

    __ inc(eax);
    __ mulx(ebx, esi, ecx);
    __ cmp(ebx, Immediate(0x00000556u));  // expected result
    __ j(not_equal, &bail_out);
    __ cmp(esi, Immediate(0x67788000u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ mulx(ebx, esi, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x00000556u));  // expected result
    __ j(not_equal, &bail_out);
    __ cmp(esi, Immediate(0x67788000u));  // expected result
    __ j(not_equal, &bail_out);

    // pdep
    __ mov(edx, Immediate(0xFFFFFFF0u));

    __ inc(eax);
    __ pdep(ebx, edx, ecx);
    __ cmp(ebx, Immediate(0x55667400u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ pdep(ebx, edx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x55667400u));  // expected result
    __ j(not_equal, &bail_out);

    // pext
    __ mov(edx, Immediate(0xFFFFFFF0u));

    __ inc(eax);
    __ pext(ebx, edx, ecx);
    __ cmp(ebx, Immediate(0x0000FFFEu));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ pext(ebx, edx, Operand(esp, 0));
    __ cmp(ebx, Immediate(0x0000FFFEu));  // expected result
    __ j(not_equal, &bail_out);

    // sarx
    __ mov(edx, Immediate(4));

    __ inc(eax);
    __ sarx(ebx, ecx, edx);
    __ cmp(ebx, Immediate(0x05566778u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ sarx(ebx, Operand(esp, 0), edx);
    __ cmp(ebx, Immediate(0x05566778u));  // expected result
    __ j(not_equal, &bail_out);

    // shlx
    __ mov(edx, Immediate(4));

    __ inc(eax);
    __ shlx(ebx, ecx, edx);
    __ cmp(ebx, Immediate(0x56677880u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ shlx(ebx, Operand(esp, 0), edx);
    __ cmp(ebx, Immediate(0x56677880u));  // expected result
    __ j(not_equal, &bail_out);

    // shrx
    __ mov(edx, Immediate(4));

    __ inc(eax);
    __ shrx(ebx, ecx, edx);
    __ cmp(ebx, Immediate(0x05566778u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ shrx(ebx, Operand(esp, 0), edx);
    __ cmp(ebx, Immediate(0x05566778u));  // expected result
    __ j(not_equal, &bail_out);

    // rorx
    __ inc(eax);
    __ rorx(ebx, ecx, 0x4);
    __ cmp(ebx, Immediate(0x85566778u));  // expected result
    __ j(not_equal, &bail_out);

    __ inc(eax);
    __ rorx(ebx, Operand(esp, 0), 0x4);
    __ cmp(ebx, Immediate(0x85566778u));  // expected result
    __ j(not_equal, &bail_out);

    // All checks passed: report 0.
    __ xor_(eax, eax);
    __ bind(&bail_out);
    // Epilogue: drop the memory operand and restore esi/ebx.
    __ pop(ecx);
    __ pop(esi);
    __ pop(ebx);
    __ ret(0);
  }

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto entry = GeneratedCode<F0>::FromCode(*code);
  CHECK_EQ(0, entry.Call());
}
|
|
|
|
|
|
|
|
|
2015-02-06 08:51:39 +00:00
|
|
|
// Jump-table test in which the table is emitted before the case bodies, so
// every table entry refers to a label that is bound later (forward jumps).
// Each case loads a distinct random value into eax; the test calls the
// generated function once per case index and compares the result.
TEST(AssemblerIa32JumpTables1) {
  // Test jump tables with forward jumps.
  CcTest::InitializeVM();
  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope handle_scope(isolate);
  Assembler assm(AssemblerOptions{});

  const int kNumCases = 512;
  int expected[kNumCases];
  isolate->random_number_generator()->NextBytes(expected, sizeof(expected));
  Label case_labels[kNumCases];

  Label done;
  Label table;
  // Fetch the case index from the stack and dispatch through the table.
  __ mov(eax, Operand(esp, 4));
  __ jmp(Operand::JumpTable(eax, times_system_pointer_size, &table));
  __ ud2();

  // The table itself: one entry per case label.
  __ bind(&table);
  for (int idx = 0; idx < kNumCases; ++idx) {
    __ dd(&case_labels[idx]);
  }

  // The case bodies, bound after the table that references them.
  for (int idx = 0; idx < kNumCases; ++idx) {
    __ bind(&case_labels[idx]);
    __ mov(eax, Immediate(expected[idx]));
    __ jmp(&done);
  }

  __ bind(&done);
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif
  auto entry = GeneratedCode<F1>::FromCode(*code);
  for (int idx = 0; idx < kNumCases; ++idx) {
    int actual = entry.Call(idx);
    ::printf("f(%d) = %d\n", idx, actual);
    CHECK_EQ(expected[idx], actual);
  }
}
|
|
|
|
|
|
|
|
|
|
|
|
// Jump-table test in which the case bodies are emitted before the table, so
// every table entry refers to a label that is already bound (backward jumps).
// Each case loads a distinct random value into eax; the test calls the
// generated function once per case index and compares the result.
TEST(AssemblerIa32JumpTables2) {
  // Test jump tables with backward jumps.
  CcTest::InitializeVM();
  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope handle_scope(isolate);
  Assembler assm(AssemblerOptions{});

  const int kNumCases = 512;
  int expected[kNumCases];
  isolate->random_number_generator()->NextBytes(expected, sizeof(expected));
  Label case_labels[kNumCases];

  Label done;
  Label table;
  // Fetch the case index from the stack and dispatch through the table.
  __ mov(eax, Operand(esp, 4));
  __ jmp(Operand::JumpTable(eax, times_system_pointer_size, &table));
  __ ud2();

  // The case bodies come first this time.
  for (int idx = 0; idx < kNumCases; ++idx) {
    __ bind(&case_labels[idx]);
    __ mov(eax, Immediate(expected[idx]));
    __ jmp(&done);
  }

  // The table is emitted after the labels it references have been bound.
  __ bind(&table);
  for (int idx = 0; idx < kNumCases; ++idx) {
    __ dd(&case_labels[idx]);
  }

  __ bind(&done);
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();
#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif
  auto entry = GeneratedCode<F1>::FromCode(*code);
  for (int idx = 0; idx < kNumCases; ++idx) {
    int actual = entry.Call(idx);
    ::printf("f(%d) = %d\n", idx, actual);
    CHECK_EQ(expected[idx], actual);
  }
}
|
|
|
|
|
2016-06-28 18:35:12 +00:00
|
|
|
// Regression test for the two operand orders of the 16-bit compare. It
// compares the register value 41 against a 16-bit memory cell holding 42 in
// both orders and expects the generated function to yield 1; either
// comparison coming out the wrong way round makes it yield 0 instead.
TEST(Regress621926) {
  // Bug description:
  // The opcodes for cmpw r/m16, r16 and cmpw r16, r/m16 were swapped.
  // This was causing non-commutative comparisons to produce the wrong result.
  CcTest::InitializeVM();
  Isolate* isolate = reinterpret_cast<Isolate*>(CcTest::isolate());
  HandleScope handle_scope(isolate);
  Assembler assm(AssemblerOptions{});

  uint16_t memory_cell = 42;

  Label mismatch;
  __ push(ebx);
  // ebx addresses the 16-bit cell (42); eax holds the register operand (41).
  __ mov(ebx, Immediate(reinterpret_cast<intptr_t>(&memory_cell)));
  __ mov(eax, Immediate(41));
  // 41 compared with 42 must not be above-or-equal.
  __ cmpw(eax, Operand(ebx, 0));
  __ j(above_equal, &mismatch);
  // 42 compared with 41 must not be below-or-equal.
  __ cmpw(Operand(ebx, 0), eax);
  __ j(below_equal, &mismatch);
  // Both comparisons behaved as expected.
  __ mov(eax, 1);
  __ pop(ebx);
  __ ret(0);
  __ bind(&mismatch);
  __ mov(eax, 0);
  __ pop(ebx);
  __ ret(0);

  CodeDesc code_desc;
  assm.GetCode(isolate, &code_desc);
  Handle<Code> code =
      Factory::CodeBuilder(isolate, code_desc, CodeKind::FOR_TESTING).Build();

#ifdef OBJECT_PRINT
  StdoutStream out;
  code->Print(out);
#endif

  auto entry = GeneratedCode<F0>::FromCode(*code);
  CHECK_EQ(1, entry.Call());
}
|
|
|
|
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
TEST(DeoptExitSizeIsFixed) {
|
|
|
|
CHECK(Deoptimizer::kSupportsFixedDeoptExitSizes);
|
|
|
|
|
|
|
|
Isolate* isolate = CcTest::i_isolate();
|
|
|
|
HandleScope handles(isolate);
|
|
|
|
v8::internal::byte buffer[256];
|
|
|
|
MacroAssembler masm(isolate, v8::internal::CodeObjectRequired::kYes,
|
|
|
|
ExternalAssemblerBuffer(buffer, sizeof(buffer)));
|
|
|
|
|
|
|
|
STATIC_ASSERT(static_cast<int>(kFirstDeoptimizeKind) == 0);
|
|
|
|
for (int i = 0; i < kDeoptimizeKindCount; i++) {
|
|
|
|
DeoptimizeKind kind = static_cast<DeoptimizeKind>(i);
|
|
|
|
Label before_exit;
|
|
|
|
masm.bind(&before_exit);
|
[Turboprop] Move deoptimizations for dynamic map checks into builtin.
In order to reduce the codegen size of dynamic map checks, add the
ability to have an eager with resume deopt point, which can call
a given builtin to perform a more detailed check than can be done
in codegen, and then either deoptimizes itself (as if the calling
code had performed an eager deopt) or resumes execution in the
calling code after the check.
In addition, support for adding extra arguments to a
deoptimization continuation is added to enable us to pass the
necessary arguments to the DynamicMapChecks builtin.
Finally, a trampoline is added to the DynamicMapChecks which saves
the registers that might be clobbered by that builtin, to avoid
having to save them in the generated code. This trampoline also
performs the deoptimization based on the result of the
DynamicMapChecks builtin.
In order to ensure both the trampoline and DynamicMapChecks
builtin have the same call interface, and to limit the number
of registers that need saving in the trampoline, the
DynamicMapChecks builtin is moved to be a CSA builtin with a
custom CallInterfaceDescriptor, that calls an exported Torque
macro that implements the actual functionality.
All told, this changes the codegen for a monomorphic dynamic
map check from:
movl rbx,<expected_map>
cmpl [<object>-0x1],rbx
jnz <deferred_call>
resume_point:
...
deferred_call:
<spill registers>
movl rax,<slot>
movq rbx,<object>
movq rcx,<handler>
movq r10,<DynamicMapChecks>
call r10
cmpq rax,0x0
jz <restore_regs>
cmpq rax,0x1
jz <deopt_point_1>
cmpq rax,0x2
jz <deopt_point_2>
int3l
restore_regs:
<restore_regs>
jmp <resume_point>
...
deopt_point_1:
call Deoptimization_Eager
deopt_point_2:
call Deoptimization_Bailout
To: movl rax,<slot>
movl rcx,<expected_map>
movq rdx,<handler>
cmpl [<object>-0x1],rcx
jnz <deopt_point>
resume_point:
...
deopt_point:
call DynamicMapChecksTrampoline
jmp <resume_point>
BUG=v8:10582
Change-Id: Ica4927b9acc963b9b73dc62d9379a7815335650f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2560197
Commit-Queue: Ross McIlroy <rmcilroy@chromium.org>
Reviewed-by: Georg Neis <neis@chromium.org>
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#71545}
2020-12-01 17:45:40 +00:00
|
|
|
if (kind == DeoptimizeKind::kEagerWithResume) {
|
2021-06-07 15:24:12 +00:00
|
|
|
Builtin target = Deoptimizer::GetDeoptWithResumeBuiltin(
|
2020-12-02 09:34:53 +00:00
|
|
|
DeoptimizeReason::kDynamicCheckMaps);
|
[Turboprop] Move deoptimizations for dynamic map checks into builtin.
In order to reduce the codegen size of dynamic map checks, add the
ability to have an eager with resume deopt point, which can call
a given builtin to perform a more detailed check than can be done
in codegen, and then either deoptimizes itself (as if the calling
code had performed an eager deopt) or resumes execution in the
calling code after the check.
In addition, support for adding extra arguments to a
deoptimization continuation is added to enable us to pass the
necessary arguments to the DynamicMapChecks builtin.
Finally, a trampoline is added to the DynamicMapChecks which saves
the registers that might be clobbered by that builtin, to avoid
having to save them in the generated code. This trampoline also
performs the deoptimization based on the result of the
DynamicMapChecks builtin.
In order to ensure both the trampoline and DynamicMapChecks
builtin have the same call interface, and to limit the number
of registers that need saving in the trampoline, the
DynamicMapChecks builtin is moved to be a CSA builtin with a
custom CallInterfaceDescriptor, that calls an exported Torque
macro that implements the actual functionality.
All told, this changes the codegen for a monomorphic dynamic
map check from:
movl rbx,<expected_map>
cmpl [<object>-0x1],rbx
jnz <deferred_call>
resume_point:
...
deferred_call:
<spill registers>
movl rax,<slot>
movq rbx,<object>
movq rcx,<handler>
movq r10,<DynamicMapChecks>
call r10
cmpq rax,0x0
jz <restore_regs>
cmpq rax,0x1
jz <deopt_point_1>
cmpq rax,0x2
jz <deopt_point_2>
int3l
restore_regs:
<restore_regs>
jmp <resume_point>
...
deopt_point_1:
call Deoptimization_Eager
deopt_point_2:
call Deoptimization_Bailout
To: movl rax,<slot>
movl rcx,<expected_map>
movq rdx,<handler>
cmpl [<object>-0x1],rcx
jnz <deopt_point>
resume_point:
...
deopt_point:
call DynamicMapChecksTrampoline
jmp <resume_point>
BUG=v8:10582
Change-Id: Ica4927b9acc963b9b73dc62d9379a7815335650f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2560197
Commit-Queue: Ross McIlroy <rmcilroy@chromium.org>
Reviewed-by: Georg Neis <neis@chromium.org>
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#71545}
2020-12-01 17:45:40 +00:00
|
|
|
masm.CallForDeoptimization(target, 42, &before_exit, kind, &before_exit,
|
|
|
|
nullptr);
|
|
|
|
CHECK_EQ(masm.SizeOfCodeGeneratedSince(&before_exit),
|
2020-12-16 17:13:42 +00:00
|
|
|
Deoptimizer::kEagerWithResumeBeforeArgsSize);
|
[Turboprop] Move deoptimizations for dynamic map checks into builtin.
In order to reduce the codegen size of dynamic map checks, add the
ability to have an eager with resume deopt point, which can call
a given builtin to perform a more detailed check than can be done
in codegen, and then either deoptimizes itself (as if the calling
code had performed an eager deopt) or resumes execution in the
calling code after the check.
In addition, support for adding extra arguments to a
deoptimization continuation is added to enable us to pass the
necessary arguments to the DynamicMapChecks builtin.
Finally, a trampoline is added to the DynamicMapChecks which saves
the registers that might be clobbered by that builtin, to avoid
having to save them in the generated code. This trampoline also
performs the deoptimization based on the result of the
DynamicMapChecks builtin.
In order to ensure both the trampoline and DynamicMapChecks
builtin have the same call interface, and to limit the number
of registers that need saving in the trampoline, the
DynamicMapChecks builtin is moved to be a CSA builtin with a
custom CallInterfaceDescriptor, that calls an exported Torque
macro that implements the actual functionality.
All told, this changes the codegen for a monomorphic dynamic
map check from:
movl rbx,<expected_map>
cmpl [<object>-0x1],rbx
jnz <deferred_call>
resume_point:
...
deferred_call:
<spill registers>
movl rax,<slot>
movq rbx,<object>
movq rcx,<handler>
movq r10,<DynamicMapChecks>
call r10
cmpq rax,0x0
jz <restore_regs>
cmpq rax,0x1
jz <deopt_point_1>
cmpq rax,0x2
jz <deopt_point_2>
int3l
restore_regs:
<restore_regs>
jmp <resume_point>
...
deopt_point_1:
call Deoptimization_Eager
deopt_point_2:
call Deoptimization_Bailout
To: movl rax,<slot>
movl rcx,<expected_map>
movq rdx,<handler>
cmpl [<object>-0x1],rcx
jnz <deopt_point>
resume_point:
...
deopt_point:
call DynamicMapChecksTrampoline
jmp <resume_point>
BUG=v8:10582
Change-Id: Ica4927b9acc963b9b73dc62d9379a7815335650f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2560197
Commit-Queue: Ross McIlroy <rmcilroy@chromium.org>
Reviewed-by: Georg Neis <neis@chromium.org>
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#71545}
2020-12-01 17:45:40 +00:00
|
|
|
} else {
|
2021-06-07 15:24:12 +00:00
|
|
|
Builtin target = Deoptimizer::GetDeoptimizationEntry(kind);
|
[Turboprop] Move deoptimizations for dynamic map checks into builtin.
In order to reduce the codegen size of dynamic map checks, add the
ability to have an eager with resume deopt point, which can call
a given builtin to perform a more detailed check than can be done
in codegen, and then either deoptimizes itself (as if the calling
code had performed an eager deopt) or resumes execution in the
calling code after the check.
In addition, support for adding extra arguments to a
deoptimization continuation is added to enable us to pass the
necessary arguments to the DynamicMapChecks builtin.
Finally, a trampoline is added to the DynamicMapChecks which saves
the registers that might be clobbered by that builtin, to avoid
having to save them in the generated code. This trampoline also
performs the deoptimization based on the result of the
DynamicMapChecks builtin.
In order to ensure both the trampoline and DynamicMapChecks
builtin have the same call interface, and to limit the number
of registers that need saving in the trampoline, the
DynamicMapChecks builtin is moved to be a CSA builtin with a
custom CallInterfaceDescriptor, that calls an exported Torque
macro that implements the actual functionality.
All told, this changes the codegen for a monomorphic dynamic
map check from:
movl rbx,<expected_map>
cmpl [<object>-0x1],rbx
jnz <deferred_call>
resume_point:
...
deferred_call:
<spill registers>
movl rax,<slot>
movq rbx,<object>
movq rcx,<handler>
movq r10,<DynamicMapChecks>
call r10
cmpq rax,0x0
jz <restore_regs>
cmpq rax,0x1
jz <deopt_point_1>
cmpq rax,0x2
jz <deopt_point_2>
int3l
restore_regs:
<restore_regs>
jmp <resume_point>
...
deopt_point_1:
call Deoptimization_Eager
deopt_point_2:
call Deoptimization_Bailout
To: movl rax,<slot>
movl rcx,<expected_map>
movq rdx,<handler>
cmpl [<object>-0x1],rcx
jnz <deopt_point>
resume_point:
...
deopt_point:
call DynamicMapChecksTrampoline
jmp <resume_point>
BUG=v8:10582
Change-Id: Ica4927b9acc963b9b73dc62d9379a7815335650f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2560197
Commit-Queue: Ross McIlroy <rmcilroy@chromium.org>
Reviewed-by: Georg Neis <neis@chromium.org>
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#71545}
2020-12-01 17:45:40 +00:00
|
|
|
masm.CallForDeoptimization(target, 42, &before_exit, kind, &before_exit,
|
|
|
|
nullptr);
|
|
|
|
CHECK_EQ(masm.SizeOfCodeGeneratedSince(&before_exit),
|
|
|
|
kind == DeoptimizeKind::kLazy
|
|
|
|
? Deoptimizer::kLazyDeoptExitSize
|
|
|
|
: Deoptimizer::kNonLazyDeoptExitSize);
|
|
|
|
}
|
Reland "Reland "[deoptimizer] Change deopt entries into builtins""
This is a reland of fbfa9bf4ec72b1b73a96b70ccb68cd98c321511b
The arm64 was missing proper codegen for CFI, thus sizes were off.
Original change's description:
> Reland "[deoptimizer] Change deopt entries into builtins"
>
> This is a reland of 7f58ced72eb65b6b5530ccabaf2eaebe45bf9d33
>
> It fixes the different exit size emitted on x64/Atom CPUs due to
> performance tuning in TurboAssembler::Call. Additionally, add
> cctests to verify the fixed size exits.
>
> Original change's description:
> > [deoptimizer] Change deopt entries into builtins
> >
> > While the overall goal of this commit is to change deoptimization
> > entries into builtins, there are multiple related things happening:
> >
> > - Deoptimization entries, formerly stubs (i.e. Code objects generated
> > at runtime, guaranteed to be immovable), have been converted into
> > builtins. The major restriction is that we now need to preserve the
> > kRootRegister, which was formerly used on most architectures to pass
> > the deoptimization id. The solution differs based on platform.
> > - Renamed DEOPT_ENTRIES_OR_FOR_TESTING code kind to FOR_TESTING.
> > - Removed heap/ support for immovable Code generation.
> > - Removed the DeserializerData class (no longer needed).
> > - arm64: to preserve 4-byte deopt exits, introduced a new optimization
> > in which the final jump to the deoptimization entry is generated
> > once per Code object, and deopt exits can continue to emit a
> > near-call.
> > - arm,ia32,x64: change to fixed-size deopt exits. This reduces exit
> > sizes by 4/8, 5, and 5 bytes, respectively.
> >
> > On arm the deopt exit size is reduced from 12 (or 16) bytes to 8 bytes
> > by using the same strategy as on arm64 (recalc deopt id from return
> > address). Before:
> >
> > e300a002 movw r10, <id>
> > e59fc024 ldr ip, [pc, <entry offset>]
> > e12fff3c blx ip
> >
> > After:
> >
> > e59acb35 ldr ip, [r10, <entry offset>]
> > e12fff3c blx ip
> >
> > On arm64 the deopt exit size remains 4 bytes (or 8 bytes in some cases
> > with CFI). Additionally, up to 4 builtin jumps are emitted per Code
> > object (max 32 bytes added overhead per Code object). Before:
> >
> > 9401cdae bl <entry offset>
> >
> > After:
> >
> > # eager deoptimization entry jump.
> > f95b1f50 ldr x16, [x26, <eager entry offset>]
> > d61f0200 br x16
> > # lazy deoptimization entry jump.
> > f95b2b50 ldr x16, [x26, <lazy entry offset>]
> > d61f0200 br x16
> > # the deopt exit.
> > 97fffffc bl <eager deoptimization entry jump offset>
> >
> > On ia32 the deopt exit size is reduced from 10 to 5 bytes. Before:
> >
> > bb00000000 mov ebx,<id>
> > e825f5372b call <entry>
> >
> > After:
> >
> > e8ea2256ba call <entry>
> >
> > On x64 the deopt exit size is reduced from 12 to 7 bytes. Before:
> >
> > 49c7c511000000 REX.W movq r13,<id>
> > e8ea2f0700 call <entry>
> >
> > After:
> >
> > 41ff9560360000 call [r13+<entry offset>]
> >
> > Bug: v8:8661,v8:8768
> > Change-Id: I13e30aedc360474dc818fecc528ce87c3bfeed42
> > Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2465834
> > Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> > Reviewed-by: Ross McIlroy <rmcilroy@chromium.org>
> > Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> > Reviewed-by: Ulan Degenbaev <ulan@chromium.org>
> > Cr-Commit-Position: refs/heads/master@{#70597}
>
> Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
> Bug: v8:8661,v8:8768,chromium:1140165
> Change-Id: Ibcd5c39c58a70bf2b2ac221aa375fc68d495e144
> Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2485506
> Reviewed-by: Jakob Gruber <jgruber@chromium.org>
> Reviewed-by: Tobias Tebbi <tebbi@chromium.org>
> Commit-Queue: Jakob Gruber <jgruber@chromium.org>
> Cr-Commit-Position: refs/heads/master@{#70655}
Tbr: ulan@chromium.org, tebbi@chromium.org, rmcilroy@chromium.org
Bug: v8:8661
Bug: v8:8768
Bug: chromium:1140165
Change-Id: I471cc94fc085e527dc9bfb5a84b96bd907c2333f
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2488682
Reviewed-by: Jakob Gruber <jgruber@chromium.org>
Commit-Queue: Jakob Gruber <jgruber@chromium.org>
Cr-Commit-Position: refs/heads/master@{#70672}
2020-10-21 05:12:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
[x64][ia32] Reconcile supported extensions
This is similar in spirit to https://crrev.com/c/2808621, which is to
ensure that no matter what combination of --[no-]enable-{extension} flag
is passed, we end up with a set of supported extensions that make sense.
The 2 rules are:
- If a newer extension is supported (SSE4_2), older extensions are
supported (SSE4_1, SSSE3, SSE3),
- If an older extension is not supported (SSE4_1), new extensions are
not supported (SSE4_2, AVX)
Tests have been added to both ia32 and x64 to check that we follow these
above 2 rules.
We change the ProbeImpl to have a reconciliation step to ensure that we
stick to the 2 rules.
E.g. if --enable-avx --no-enable-sse4-2, we will first set AVX to
supported, then in the second step, fix-up AVX to unsupported. In this
sense, the --no version of the flags take priority. This more accurately
follows the intention of the flags.
Bug: chromium:1195579
Change-Id: I0390f24de9d203fe6bbd4cc02a23771a1f052618
Reviewed-on: https://chromium-review.googlesource.com/c/v8/v8/+/2818570
Commit-Queue: Zhi An Ng <zhin@chromium.org>
Reviewed-by: Michael Achenbach <machenbach@chromium.org>
Reviewed-by: Clemens Backes <clemensb@chromium.org>
Reviewed-by: Andreas Haas <ahaas@chromium.org>
Cr-Commit-Position: refs/heads/master@{#73942}
2021-04-13 20:56:47 +00:00
|
|
|
// Checks that the answers returned by CpuFeatures::IsSupported are mutually
// consistent. Each CHECK_IMPLIES(a, b) below states, as the macro name
// indicates, that b must hold whenever a holds. The first group pairs an
// extension with the one it builds on (FMA3/AVX2 -> AVX -> SSE4_2 -> SSE4_1
// -> SSSE3 -> SSE3); the second group restates exactly the same relations in
// contrapositive form (missing older extension => missing newer extension).
TEST(CpuFeatures_ProbeImpl) {
|
|
|
|
// Support for a newer extension implies support for the older extensions.
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(FMA3), CpuFeatures::IsSupported(AVX));
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(AVX2), CpuFeatures::IsSupported(AVX));
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(AVX),
|
|
|
|
CpuFeatures::IsSupported(SSE4_2));
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(SSE4_2),
|
|
|
|
CpuFeatures::IsSupported(SSE4_1));
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(SSE4_1),
|
|
|
|
CpuFeatures::IsSupported(SSSE3));
|
|
|
|
CHECK_IMPLIES(CpuFeatures::IsSupported(SSSE3),
|
|
|
|
CpuFeatures::IsSupported(SSE3));
|
|
|
|
|
|
|
|
// Check the reverse, if an older extension is not supported, a newer
|
|
|
|
// extension cannot be supported.
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(SSE3),
|
|
|
|
!CpuFeatures::IsSupported(SSSE3));
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(SSSE3),
|
|
|
|
!CpuFeatures::IsSupported(SSE4_1));
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(SSE4_1),
|
|
|
|
!CpuFeatures::IsSupported(SSE4_2));
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(SSE4_2),
|
|
|
|
!CpuFeatures::IsSupported(AVX));
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(AVX),
|
|
|
|
!CpuFeatures::IsSupported(AVX2));
|
|
|
|
CHECK_IMPLIES(!CpuFeatures::IsSupported(AVX),
|
|
|
|
!CpuFeatures::IsSupported(FMA3));
|
|
|
|
}
|
|
|
|
|
2008-08-22 13:33:59 +00:00
|
|
|
#undef __
|
2017-08-31 12:34:55 +00:00
|
|
|
|
|
|
|
} // namespace internal
|
|
|
|
} // namespace v8
|