mongodb · vbabanin · Apr 24, 2025 · Mar 31, 2025 · Apr 3, 2025 · Apr 3, 2025
diff --git a/bson/src/main/org/bson/ByteBuf.java b/bson/src/main/org/bson/ByteBuf.java
@@ -136,6 +136,26 @@ public interface ByteBuf  {
      */
     byte[] array();
 
+    /**
+     * States whether this buffer is backed by an accessible byte array. If this method returns {@code true} then the
+     * {@link #array()} and {@link #arrayOffset()} methods may safely be invoked. If it returns {@code false}, those
+     * methods may throw an exception.
+     *
+     * @return {@code true} if, and only if, this buffer is backed by an array and is not read-only
+     * @since 5.5
+     */
+    boolean isBackedByArray();
+
+    /**
+     * Returns the offset of the first byte within the backing byte array of this buffer.
+     *
+     * @return the offset within this buffer's backing array of the first byte of the buffer
+     * @throws java.nio.ReadOnlyBufferException If this buffer is backed by an array but is read-only
+     * @throws UnsupportedOperationException if this buffer is not backed by an accessible array
+     * @since 5.5
+     */
+    int arrayOffset();
+
     /**
      * Returns this buffer's limit.
      *

diff --git a/bson/src/main/org/bson/ByteBufNIO.java b/bson/src/main/org/bson/ByteBufNIO.java
@@ -108,6 +108,16 @@ public byte[] array() {
         return buf.array();
     }
 
+    @Override
+    public boolean isBackedByArray() {
+        return buf.hasArray(); // asks the same wrapped buffer that array() and arrayOffset() delegate to
+    }
+
+    @Override
+    public int arrayOffset() {
+        return buf.arrayOffset(); // offset as reported by the wrapped buffer, relative to the array returned by array()
+    }
+
     @Override
     public int limit() {
         return buf.limit();

diff --git a/bson/src/main/org/bson/internal/PlatformUtil.java b/bson/src/main/org/bson/internal/PlatformUtil.java
@@ -0,0 +1,52 @@
+/*
+ * Copyright 2008-present MongoDB, Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.bson.internal;
+
+/**
+ * Internal helper for querying characteristics of the platform the JVM runs on.
+ * This class is not part of the public API and may be removed or changed at any time.
+ */
+public final class PlatformUtil {
+
+    // Architectures assumed to support unaligned memory access; others might as well, but it is safer to assume they don't.
+    private static final String[] ARCHITECTURES_ALLOWING_UNALIGNED_ACCESS = {
+            "x86",
+            "amd64",
+            "i386",
+            "x86_64",
+            "arm64", // evergreen dbx-perf-distro uses this architecture
+            "aarch64"};
+
+    private PlatformUtil() {}
+
+    /** Returns {@code true} only if the {@code os.arch} system property names an architecture listed as allowing unaligned access. */
+    public static boolean isUnalignedAccessAllowed() {
+        final String processArch;
+        try {
+            processArch = System.getProperty("os.arch");
+        } catch (Exception e) {
+            return false; // the property could not be read (e.g. security exception): proceed with the default value
+        }
+        for (String supportedArch : ARCHITECTURES_ALLOWING_UNALIGNED_ACCESS) {
+            if (supportedArch.equals(processArch)) {
+                return true;
+            }
+        }
+        return false;
+    }
+}
+
diff --git a/bson/src/main/org/bson/io/ByteBufferBsonInput.java b/bson/src/main/org/bson/io/ByteBufferBsonInput.java
@@ -24,6 +24,7 @@
 import java.nio.charset.StandardCharsets;
 
 import static java.lang.String.format;
+import static org.bson.internal.PlatformUtil.isUnalignedAccessAllowed;
 
 /**
  * An implementation of {@code BsonInput} that is backed by a {@code ByteBuf}.
@@ -33,6 +34,14 @@
 public class ByteBufferBsonInput implements BsonInput {
 
     private static final String[] ONE_BYTE_ASCII_STRINGS = new String[Byte.MAX_VALUE + 1];
+    private static final boolean UNALIGNED_ACCESS_SUPPORTED = isUnalignedAccessAllowed(); // gates the SWAR C-string scan
+    /* A dynamically sized scratch buffer, reused across BSON string reads from buffers that are not array-backed:
+     * 1. Reduces garbage collection by avoiding new byte array creation.
+     * 2. Improves cache utilization through temporal locality.
+     * 3. Avoids JVM allocation and zeroing cost for new memory allocations.
+     */
+    private byte[] scratchBuffer;
+
 
     static {
         for (int b = 0; b < ONE_BYTE_ASCII_STRINGS.length; b++) {
@@ -127,15 +136,12 @@ public String readString() {
 
     @Override
     public String readCString() {
-        int mark = buffer.position();
-        skipCString();
-        int size = buffer.position() - mark;
-        buffer.position(mark);
+        int size = computeCStringLength(buffer.position()); // size includes the null terminator
         return readString(size);
     }
 
-    private String readString(final int size) {
-        if (size == 2) {
+    private String readString(final int bsonStringSize) {
+        if (bsonStringSize == 2) {
             byte asciiByte = buffer.get();               // if only one byte in the string, it must be ascii.
             byte nullByte = buffer.get();                // read null terminator
             if (nullByte != 0) {
@@ -146,26 +152,74 @@ private String readString(final int size) {
             }
             return ONE_BYTE_ASCII_STRINGS[asciiByte];  // this will throw if asciiByte is negative
         } else {
-            byte[] bytes = new byte[size - 1];
-            buffer.get(bytes);
-            byte nullByte = buffer.get();
-            if (nullByte != 0) {
-                throw new BsonSerializationException("Found a BSON string that is not null-terminated");
+            if (buffer.isBackedByArray()) {
+                int position = buffer.position();
+                int arrayOffset = buffer.arrayOffset();
+                int newPosition = position + bsonStringSize;
+                buffer.position(newPosition);
+
+                byte[] array = buffer.array();
+                if (array[arrayOffset + newPosition - 1] != 0) {
+                    throw new BsonSerializationException("Found a BSON string that is not null-terminated");
+                }
+                return new String(array, arrayOffset + position, bsonStringSize - 1, StandardCharsets.UTF_8);
+            } else if (scratchBuffer == null || bsonStringSize > scratchBuffer.length) {
+                int scratchBufferSize = bsonStringSize + (bsonStringSize >>> 1); //1.5 times the size
+                scratchBuffer = new byte[scratchBufferSize];
             }
-            return new String(bytes, StandardCharsets.UTF_8);
+
+            buffer.get(scratchBuffer, 0, bsonStringSize);
+            if (scratchBuffer[bsonStringSize - 1] != 0) {
+                throw new BsonSerializationException("BSON string not null-terminated");
+            }
+            return new String(scratchBuffer, 0, bsonStringSize - 1, StandardCharsets.UTF_8);
         }
     }
 
     @Override
     public void skipCString() {
         ensureOpen();
-        boolean checkNext = true;
-        while (checkNext) {
-            if (!buffer.hasRemaining()) {
-                throw new BsonSerializationException("Found a BSON string that is not null-terminated");
+        int pos = buffer.position();
+        int length = computeCStringLength(pos); // counts the null terminator; throws if none is found before the limit
+        buffer.position(pos + length); // move just past the terminator
+    }
+
+    /* Returns the number of bytes from prevPos up to and including the first null byte at or after the buffer's position.
+     * When unaligned access is supported, SWAR (SIMD Within A Register) tests 8 bytes at once; remaining bytes are scanned
+     * one by one. Throws BsonSerializationException, leaving the position at the limit, if no null byte is found.
+     */
+    private int computeCStringLength(final int prevPos) {
+        ensureOpen();
+        int pos = buffer.position();
+        int limit = buffer.limit();
+
+        if (UNALIGNED_ACCESS_SUPPORTED) {
+            int chunks = (limit - pos) >>> 3;
+            // Process 8 bytes at a time; the mask ends up non-zero only if the word contains a zero byte.
+            for (int i = 0; i < chunks; i++) {
+                long word = buffer.getLong(pos);
+                long mask = word - 0x0101010101010101L;
+                mask &= ~word;
+                mask &= 0x8080808080808080L;
+                if (mask != 0) {
+                    // The lowest set bit marks the first null terminator, assuming getLong reads a Little Endian long
+                    int offset = Long.numberOfTrailingZeros(mask) >>> 3;
+                    // The null is at pos + offset; the returned length counts it, hence the + 1.
+                    return (pos - prevPos) + offset + 1;
+                }
+                pos += 8;
             }
-            checkNext = buffer.get() != 0;
         }
+
+        // Process remaining bytes one-by-one.
+        while (pos < limit) {
+            if (buffer.get(pos++) == 0) {
+                return (pos - prevPos);
+            }
+        }
+
+        buffer.position(pos); // no terminator found: pos equals the limit here
+        throw new BsonSerializationException("Found a BSON string that is not null-terminated");
     }
 
     @Override

diff --git a/bson/src/test/unit/org/bson/internal/PlatformUtilTest.java b/bson/src/test/unit/org/bson/internal/PlatformUtilTest.java
@@ -0,0 +1,71 @@
+/*
+ * Copyright 2008-present MongoDB, Inc.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.bson.internal;
+
+import org.junit.jupiter.api.DisplayName;
+import org.junit.jupiter.api.Test;
+import org.junit.jupiter.params.ParameterizedTest;
+import org.junit.jupiter.params.provider.ValueSource;
+
+import static org.junit.Assert.assertFalse;
+import static org.junit.Assert.assertTrue;
+
+class PlatformUtilTest {
+
+    @ParameterizedTest
+    @ValueSource(strings = {"arm", "ppc", "ppc64", "sparc", "mips"})
+    @DisplayName("Should not allow unaligned access for unsupported architectures")
+    void shouldNotAllowUnalignedAccessForUnsupportedArchitecture(final String architecture) {
+        withSystemProperty("os.arch", architecture, () -> assertFalse(PlatformUtil.isUnalignedAccessAllowed()));
+    }
+
+    @Test
+    @DisplayName("Should not allow unaligned access when system property is undefined")
+    void shouldNotAllowUnalignedAccessWhenSystemPropertyIsUndefined() {
+        withSystemProperty("os.arch", null, () -> assertFalse(PlatformUtil.isUnalignedAccessAllowed()));
+    }
+
+    @ParameterizedTest
+    @ValueSource(strings = {"x86", "amd64", "i386", "x86_64", "arm64", "aarch64"})
+    @DisplayName("Should allow unaligned access for supported architectures")
+    void shouldAllowUnalignedAccess(final String architecture) {
+        withSystemProperty("os.arch", architecture, () -> assertTrue(PlatformUtil.isUnalignedAccessAllowed()));
+    }
+
+    /**
+     * Runs {@code testCode} with the system property {@code name} set to {@code value}, or cleared if {@code value} is
+     * {@code null}. Afterwards the property is restored to its previous state, even if {@code testCode} throws; a property
+     * that was not set before the call is cleared again rather than passed to {@code System.setProperty} as {@code null}.
+     */
+    public static void withSystemProperty(final String name, final String value, final Runnable testCode) {
+        String original = System.getProperty(name);
+        if (value == null) {
+            System.clearProperty(name);
+        } else {
+            System.setProperty(name, value);
+        }
+        try {
+            testCode.run();
+        } finally {
+            if (original == null) {
+                System.clearProperty(name); // System.setProperty throws NullPointerException for a null value
+            } else {
+                System.setProperty(name, original);
+            }
+        }
+    }
+}
diff --git a/driver-core/src/main/com/mongodb/internal/connection/CompositeByteBuf.java b/driver-core/src/main/com/mongodb/internal/connection/CompositeByteBuf.java
@@ -213,6 +213,16 @@ public byte[] array() {
         throw new UnsupportedOperationException("Not implemented yet!");
     }
 
+    @Override
+    public boolean isBackedByArray() {
+        return false; // array() and arrayOffset() are unsupported here and throw UnsupportedOperationException
+    }
+
+    @Override
+    public int arrayOffset() {
+        throw new UnsupportedOperationException("Not implemented yet!"); // consistent with isBackedByArray() returning false
+    }
+
     @Override
     public ByteBuf limit(final int newLimit) {
         if (newLimit < 0 || newLimit > capacity()) {

diff --git a/driver-core/src/main/com/mongodb/internal/connection/ResponseBuffers.java b/driver-core/src/main/com/mongodb/internal/connection/ResponseBuffers.java
@@ -53,13 +53,15 @@ <T extends BsonDocument> T getResponseDocument(final int messageId, final Decode
     }
 
     /**
-     * Returns a read-only buffer containing the response body.  Care should be taken to not use the returned buffer after this instance has
+     * Returns a buffer containing the response body.  Care should be taken to not use the returned buffer after this instance has
      * been closed.
      *
-     * @return a read-only buffer containing the response body
+     * <p>NOTE: do not modify the returned buffer; it is intentionally not read-only so that reads can avoid redundant copying.</p>
+     *
+     * @return a buffer containing the response body
      */
     public ByteBuf getBodyByteBuffer() {
-        return bodyByteBuffer.asReadOnly();
+        return bodyByteBuffer; // the internal buffer itself, not a read-only view
     }
 
     public void reset() {

diff --git a/driver-core/src/main/com/mongodb/internal/connection/netty/NettyByteBuf.java b/driver-core/src/main/com/mongodb/internal/connection/netty/NettyByteBuf.java
@@ -100,6 +100,16 @@ public byte[] array() {
         return proxied.array();
     }
 
+    @Override
+    public boolean isBackedByArray() {
+        return proxied.hasArray(); // delegates to the proxied buffer, as array() does
+    }
+
+    @Override
+    public int arrayOffset() {
+        return proxied.arrayOffset(); // delegates to the proxied buffer, as array() does
+    }
+
     @Override
     public int limit() {
         if (isWriting) {