8339531: Improve performance of MemorySegment::mismatch

Reviewed-by: mcimadamore
This commit is contained in:
Per Minborg 2024-09-12 18:31:08 +00:00
parent ab9b72c50a
commit 81ff91ef27
7 changed files with 559 additions and 211 deletions

View file

@ -41,21 +41,16 @@ import java.lang.foreign.MemorySegment;
import java.nio.ByteBuffer;
import java.util.concurrent.TimeUnit;
import static java.lang.foreign.ValueLayout.*;
@BenchmarkMode(Mode.AverageTime)
@Warmup(iterations = 5, time = 500, timeUnit = TimeUnit.MILLISECONDS)
@Measurement(iterations = 10, time = 500, timeUnit = TimeUnit.MILLISECONDS)
@State(Scope.Thread)
@OutputTimeUnit(TimeUnit.NANOSECONDS)
@Fork(value = 3)
public class CopyTest {
public class SegmentBulkCopy {
@Param({"0", "1", "2", "3", "4", "5", "6", "7", "8",
"9", "10", "11", "12", "13", "14", "15", "16",
"17", "18", "19", "20", "21", "22", "23", "24",
"25", "26", "27", "28", "29", "30", "31", "32",
"33", "36", "40", "44", "48", "52", "56", "60", "63", "64", "128"})
@Param({"2", "3", "4", "5", "6", "7", "8", "64", "512",
"4096", "32768", "262144", "2097152", "16777216", "134217728"})
public int ELEM_SIZE;
byte[] srcArray;
@ -80,28 +75,37 @@ public class CopyTest {
}
@Benchmark
public void array_copy() {
public void arrayCopy() {
System.arraycopy(srcArray, 0, dstArray, 0, ELEM_SIZE);
}
@Benchmark
public void heap_segment_copy5Arg() {
MemorySegment.copy(heapSrcSegment, 0, heapDstSegment, 0, ELEM_SIZE);
}
@Benchmark
public void native_segment_copy5Arg() {
MemorySegment.copy(nativeSrcSegment, 0, nativeDstSegment, 0, ELEM_SIZE);
}
@Benchmark
public void heap_segment_copy7arg() {
MemorySegment.copy(heapSrcSegment, JAVA_BYTE, 0, heapDstSegment, JAVA_BYTE, 0, ELEM_SIZE);
}
@Benchmark
public void buffer_copy() {
public void bufferCopy() {
dstBuffer.put(srcBuffer);
}
/**
 * Benchmarks the five-argument {@code MemorySegment.copy} from {@code heapSrcSegment}
 * to {@code heapDstSegment}, copying {@code ELEM_SIZE} bytes starting at offset 0 in both.
 * The forked JVM runs with the copy threshold-power property set to 31.
 * NOTE(review): presumably a power of 31 keeps every tested size on the pure-Java copy
 * path (hence the "Java" suffix) -- confirm against the code that reads this property.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.copy=31"})
@Benchmark
public void heapSegmentCopyJava() {
MemorySegment.copy(heapSrcSegment, 0, heapDstSegment, 0, ELEM_SIZE);
}
/**
 * Benchmarks the five-argument {@code MemorySegment.copy} from {@code heapSrcSegment}
 * to {@code heapDstSegment}, copying {@code ELEM_SIZE} bytes starting at offset 0 in both.
 * The forked JVM runs with the copy threshold-power property set to 0.
 * NOTE(review): presumably a power of 0 routes every size to the native/Unsafe copy
 * path (hence the "Unsafe" suffix) -- confirm against the code that reads this property.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.copy=0"})
@Benchmark
public void heapSegmentCopyUnsafe() {
MemorySegment.copy(heapSrcSegment, 0, heapDstSegment, 0, ELEM_SIZE);
}
/**
 * Benchmarks the five-argument {@code MemorySegment.copy} from {@code nativeSrcSegment}
 * to {@code nativeDstSegment}, copying {@code ELEM_SIZE} bytes starting at offset 0 in both.
 * The forked JVM runs with the copy threshold-power property set to 31.
 * NOTE(review): presumably a power of 31 keeps every tested size on the pure-Java copy
 * path (hence the "Java" suffix) -- confirm against the code that reads this property.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.copy=31"})
@Benchmark
public void nativeSegmentCopyJava() {
MemorySegment.copy(nativeSrcSegment, 0, nativeDstSegment, 0, ELEM_SIZE);
}
/**
 * Benchmarks the five-argument {@code MemorySegment.copy} from {@code nativeSrcSegment}
 * to {@code nativeDstSegment}, copying {@code ELEM_SIZE} bytes starting at offset 0 in both.
 * The forked JVM runs with the copy threshold-power property set to 0.
 * NOTE(review): presumably a power of 0 routes every size to the native/Unsafe copy
 * path (hence the "Unsafe" suffix) -- confirm against the code that reads this property.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.copy=0"})
@Benchmark
public void nativeSegmentCopyUnsafe() {
MemorySegment.copy(nativeSrcSegment, 0, nativeDstSegment, 0, ELEM_SIZE);
}
}

View file

@ -48,13 +48,10 @@ import java.util.concurrent.TimeUnit;
@State(Scope.Thread)
@OutputTimeUnit(TimeUnit.NANOSECONDS)
@Fork(value = 3)
public class TestFill {
public class SegmentBulkFill {
@Param({"0", "1", "2", "3", "4", "5", "6", "7",
"8", "9", "10", "11", "12", "13", "14", "15",
"16", "17", "18", "19", "20", "21", "22", "23",
"24", "25", "26", "27", "28", "29", "30", "31",
"32", "128", "256", "384", "511", "512"})
@Param({"2", "3", "4", "5", "6", "7", "8", "64", "512",
"4096", "32768", "262144", "2097152", "16777216", "134217728"})
public int ELEM_SIZE;
byte[] array;
@ -73,22 +70,43 @@ public class TestFill {
}
@Benchmark
public void arrays_fill() {
public void arraysFill() {
Arrays.fill(array, (byte) 0);
}
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=31"})
@Benchmark
public void heap_segment_fill() {
public void heapSegmentFillJava() {
heapSegment.fill((byte) 0);
}
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=0"})
@Benchmark
public void native_segment_fill() {
public void heapSegmentFillUnsafe() {
heapSegment.fill((byte) 0);
}
/**
 * Benchmarks filling {@code nativeSegment} with zero bytes via {@code MemorySegment.fill}.
 * The forked JVM runs with the fill threshold-power property set to 31.
 * NOTE(review): presumably a power of 31 keeps every tested size on the pure-Java fill
 * path (hence the "Java" suffix) -- confirm against the code that reads this property.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=31"})
@Benchmark
public void nativeSegmentFillJava() {
nativeSegment.fill((byte) 0);
}
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=0"})
@Benchmark
public void unaligned_segment_fill() {
public void nativeSegmentFillUnsafe() {
nativeSegment.fill((byte) 0);
}
/**
 * Benchmarks filling {@code unalignedSegment} with zero bytes via {@code MemorySegment.fill}.
 * The forked JVM runs with the fill threshold-power property set to 31.
 * NOTE(review): presumably a power of 31 keeps every tested size on the pure-Java fill
 * path (hence the "Java" suffix), and the segment is deliberately misaligned in the
 * setup code that is not visible here -- confirm both.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=31"})
@Benchmark
public void unalignedSegmentFillJava() {
unalignedSegment.fill((byte) 0);
}
/**
 * Benchmarks filling {@code unalignedSegment} with zero bytes via {@code MemorySegment.fill}.
 * The forked JVM runs with the fill threshold-power property set to 0.
 * NOTE(review): presumably a power of 0 routes every size to the native/Unsafe fill
 * path (hence the "Unsafe" suffix), and the segment is deliberately misaligned in the
 * setup code that is not visible here -- confirm both.
 */
@Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.fill=0"})
@Benchmark
public void unalignedSegmentFillUnsafe() {
unalignedSegment.fill((byte) 0);
}

View file

@ -0,0 +1,112 @@
/*
* Copyright (c) 2024, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*
*/
package org.openjdk.bench.java.lang.foreign;
import org.openjdk.jmh.annotations.Benchmark;
import org.openjdk.jmh.annotations.BenchmarkMode;
import org.openjdk.jmh.annotations.Fork;
import org.openjdk.jmh.annotations.Measurement;
import org.openjdk.jmh.annotations.Mode;
import org.openjdk.jmh.annotations.OutputTimeUnit;
import org.openjdk.jmh.annotations.Param;
import org.openjdk.jmh.annotations.Scope;
import org.openjdk.jmh.annotations.Setup;
import org.openjdk.jmh.annotations.State;
import org.openjdk.jmh.annotations.Warmup;
import java.lang.foreign.Arena;
import java.lang.foreign.MemorySegment;
import java.util.Arrays;
import java.util.Random;
import java.util.concurrent.TimeUnit;
import static java.lang.foreign.ValueLayout.*;
/**
 * JMH benchmark measuring {@link MemorySegment#mismatch(MemorySegment)} on native and
 * heap segments, with {@link Arrays#mismatch(byte[], byte[])} on plain byte arrays as
 * a baseline.
 *
 * <p>Source and destination always hold identical content, so every benchmarked call
 * has to compare the full {@code ELEM_SIZE} bytes and reports "no mismatch" (-1).
 *
 * <p>The segment benchmarks are forked with different values of the
 * {@code java.lang.foreign.native.threshold.power.mismatch} system property.
 * NOTE(review): presumably 31 keeps all sizes on the pure-Java path ("Java" variants)
 * and 0 sends all sizes to the native/Unsafe path ("Unsafe" variants) -- confirm
 * against the implementation that reads this property.
 */
@BenchmarkMode(Mode.AverageTime)
@Warmup(iterations = 5, time = 500, timeUnit = TimeUnit.MILLISECONDS)
@Measurement(iterations = 10, time = 500, timeUnit = TimeUnit.MILLISECONDS)
@State(Scope.Thread)
@OutputTimeUnit(TimeUnit.NANOSECONDS)
@Fork(value = 3)
public class SegmentBulkMismatch {

    /** Number of bytes in each compared region; injected by JMH for every run. */
    @Param({"2", "3", "4", "5", "6", "7", "8", "64", "512",
            "4096", "32768", "262144", "2097152", "16777216", "134217728"})
    public int ELEM_SIZE;

    MemorySegment srcNative;
    MemorySegment dstNative;
    byte[] srcArray;
    byte[] dstArray;
    MemorySegment srcHeap;
    MemorySegment dstHeap;

    /**
     * Allocates the native segments, fills the source with reproducible pseudo-random
     * bytes, and derives byte-for-byte identical array and heap-segment copies from it.
     */
    @Setup
    public void setup() {
        // Always use the same alignment regardless of size
        srcNative = Arena.ofAuto().allocate(ELEM_SIZE, 16);
        dstNative = Arena.ofAuto().allocate(ELEM_SIZE, 16);
        // Fixed seed so every fork compares exactly the same data.
        var rnd = new Random(42);
        for (int i = 0; i < ELEM_SIZE; i++) {
            // nextInt(origin, bound) excludes bound, hence the +1 so that
            // Byte.MAX_VALUE can be produced as well.
            srcNative.set(JAVA_BYTE, i, (byte) rnd.nextInt(Byte.MIN_VALUE, Byte.MAX_VALUE + 1));
        }
        dstNative.copyFrom(srcNative);
        srcArray = srcNative.toArray(JAVA_BYTE);
        dstArray = dstNative.toArray(JAVA_BYTE);
        srcHeap = MemorySegment.ofArray(srcArray);
        dstHeap = MemorySegment.ofArray(dstArray);
    }

    /** Mismatch of two native segments with the threshold-power property set to 31. */
    @Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.mismatch=31"})
    @Benchmark
    public long nativeSegmentJava() {
        return srcNative.mismatch(dstNative);
    }

    /** Mismatch of two array-backed segments with the threshold-power property set to 31. */
    @Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.mismatch=31"})
    @Benchmark
    public long heapSegmentJava() {
        return srcHeap.mismatch(dstHeap);
    }

    /** Mismatch of two native segments with the threshold-power property set to 0. */
    @Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.mismatch=0"})
    @Benchmark
    public long nativeSegmentUnsafe() {
        return srcNative.mismatch(dstNative);
    }

    /** Mismatch of two array-backed segments with the threshold-power property set to 0. */
    @Fork(value = 3, jvmArgsAppend = {"-Djava.lang.foreign.native.threshold.power.mismatch=0"})
    @Benchmark
    public long heapSegmentUnsafe() {
        return srcHeap.mismatch(dstHeap);
    }

    /** Baseline: {@code Arrays.mismatch} on the plain byte arrays, using the class-level fork settings. */
    @Benchmark
    public long array() {
        return Arrays.mismatch(srcArray, dstArray);
    }
}