IsValidUtf8TestUtil.java example

Explorer

MaritimeCloud-master
- mc-core
  - src
    - main
      - java
        net
        maritimecloud
        core
        id
        MaritimeId.java
        MmsiId.java
        ServerId.java
        TestId.java
        package-info.java
        internal
        message
        AbstractMessageReader.java
        BinaryUtil.java
        Hashing.java
        MessageHelper.java
        TaggableMessageWriter.java
        TaggableValueWriter.java
        binary
        AbstractBinaryMessageWriter.java
        AbstractBinaryValueReader.java
        AbstractBinaryValueWriter.java
        BinaryUtils.java
        Exceptions.java
        ReaderUtils.java
        compact
        BinaryInputStream.java
        BinaryMessageReader.java
        BinaryMessageWriter.java
        BinaryOutputStream.java
        BinaryValueReader.java
        BinaryValueWriter.java
        FlexibleBinaryValueReader.java
        TReader.java
        TReader8Bit.java
        TReaderConstant.java
        Types.java
        protobuf
        ProtobufMessageReader.java
        ProtobufMessageWriter.java
        ProtobufValueReader.java
        ProtobufValueWriter.java
        ProtobufWireFormat.java
        text
        AbstractTextMessageWriter.java
        AbstractTextValueReader.java
        AbstractTextValueWriter.java
        json
        JsonMessageReader.java
        JsonValueReader.java
        JsonValueWriter.java
        security
        Credentials.java
        SecurityTools.java
        util
        ClassUtil.java
        logging
        AbstractLogger.java
        JDKLogger.java
        LazyJdkLogger.java
        LogFactory.java
        Logger.java
        SLF4JLogger.java
        message
        Message.java
        MessageEnum.java
        MessageEnumSerializer.java
        MessageFormatType.java
        MessageReader.java
        MessageSerializer.java
        MessageVisitor.java
        MessageWriter.java
        SerializationException.java
        ValueReader.java
        ValueSerializer.java
        ValueWriter.java
        package-info.java
        net
        Acknowledgement.java
        BroadcastConsumer.java
        BroadcastMessage.java
        BroadcastSubscription.java
        DispatchedMessage.java
        EndpointImplementation.java
        EndpointInvocationFuture.java
        EndpointRegistration.java
        EndpointUnavailableException.java
        Environment.java
        InternetConnectionType.java
        LocalEndpoint.java
        MessageHeader.java
        package-info.java
        util
        Binary.java
        BoundedBinary.java
        Country.java
        Language.java
        LiteralBinary.java
        RopeBinary.java
        Timestamp.java
        Utf8.java
        geometry
        Area.java
        AreaUnion.java
        Circle.java
        CoordinateConverter.java
        CoordinateSystem.java
        Ellipse.java
        Line.java
        Point.java
        Polygon.java
        Position.java
        PositionReader.java
        PositionReaderSimulator.java
        PositionTime.java
        Rectangle.java
        package-info.java
        package-info.java
        units
        DistanceUnit.java
        SpeedUnit.java
        package-info.java
    - test
      - java
        net
        maritimecloud
        internal
        message
        HashingTest.java
        binary
        protobuf
        AbstractProtobufTest.java
        TestProtobufSerialization.java
        rnd
        RndBaseType.java
        RndMessage.java
        RndTest.java
        RndType.java
        SerializerImpl.java
        text
        json
        AbstractJSONTest.java
        JSONMessageWriterTest.java
        TestReader.java
        TestWriter.java
        message
        TestEnum.java
        util
        BoundedByteStringTest.java
        ByteStringTest.java
        CountryTest.java
        DistanceUnitTest.java
        IsValidUtf8Test.java
        IsValidUtf8TestUtil.java
        LiteralByteStringTest.java
        RopeByteStringSubstringTest.java
        RopeByteStringTest.java
        SpeedUnitTest.java
        geometry
        AbstractAreaTest.java
        AreaTest.java
        BoundingBoxTest.java
        EllipseTest.java
        PolygonTest.java
        PositionTest.java
        PositionTimeTest.java
        RectangleTest.java
        units
        DistanceUnitTest.java
- mc-mms
  - distribution
    - mc-mms-client
      - src
        main
        java
        JavadocDummy.java
    - mc-mms-client-android
      - src
        main
        java
        net
        maritimecloud
        internal
        net
        client
        connection
        ConnectionTransportManagerAndroid.java
    - mc-mms-client-javaee
      - src
        main
        java
        JavadocDummy.java
    - mc-mms-server-standalone
      - src
        main
        java
        JavadocDummy.java
  - mc-mms-client-api
    - src
      - main
        java
        net
        maritimecloud
        net
        mms
        MmsBroadcastOptions.java
        MmsClient.java
        MmsClientClosedException.java
        MmsClientConfiguration.java
        MmsClientShutdown.java
        MmsConnection.java
        MmsConnectionClosingCode.java
        MmsConnectionException.java
        MmsEndpointLocator.java
        package-info.java
  - mc-mms-client-impl
    - src
      - main
        java
        net
        maritimecloud
        internal
        mms
        client
        ClientInfo.java
        ConnectionKeepAlive.java
        DefaultMmsClient.java
        MmsThreadManager.java
        broadcast
        BroadcastDeserializer.java
        ClientBroadcastManager.java
        DispatchedBroadcast.java
        SubscriptionSet.java
        connection
        ClientConnection.java
        DefaultMmsConnection.java
        MmsConnectionListenerInvoker.java
        session
        Session.java
        SessionListener.java
        SessionSender.java
        SessionState.java
        SessionStateConnected.java
        SessionStateConnecting.java
        SessionStateDisconnected.java
        SessionStateDisconnecting.java
        TestIt.java
        transport
        ClientTransport.java
        ClientTransportFactory.java
        ClientTransportFactoryJetty.java
        ClientTransportFactoryJsr356.java
        ClientTransportFactoryTomcat.java
        ClientTransportJsr356.java
        ClientTransportListener.java
        ClientTransportListeners.java
        TransportSecurityUtils.java
        endpoint
        ClientEndpointManager.java
        DefaultEndpointInvocator.java
        DefaultEndpointLocator.java
        DefaultEndpointRegistration.java
        RemoteInvocation.java
      - test
        java
        net
        maritimecloud
        internal
        mms
        client
        AbstractClientConnectionTest.java
        MoreAsserts.java
        TestClientEndpoint.java
        TestWebSocketServer.java
        broadcast
        BroadcastFutureTest.java
        BroadcastTest.java
        connection
        AbstractConnectionTest.java
        DisableEnableTest.java
        ListenerTest.java
        OldConnectTest.java
        OldContinuesReconnectTest.java
        OldReconnect2Test.java
        OldReconnectTest.java
        OldReconnectTest3.java
        OldRepeatRule.java
        ReconnectTest.java
        SimpleTest.java
        session
        AbstractSessionTest.java
        CloseTest.java
        ConnectTest.java
        DelegateConnectionListener.java
        ReconnectNewSessionTest.java
        ReconnectTest.java
        SendReceiveMessageTest.java
        transport
        ClientT.java
        ServerT.java
        TestConnectionTransport.java
        endpoint
        EndpointTest.java
        HelloWorldEndpointImpl.java
        mms
        stubs
        AbstractHelloWorldEndpoint.java
        AbstractShipEndpoint.java
        AbstractTestEndpoint.java
        BroadcastTestMessage.java
        GenerateTestStubs.java
        HelloWorldEndpoint.java
        ShipEndpoint.java
        TestEndpoint.java
        TestMessage.java
        net
        mms
        services
        CoreServices.java
        RemoteActor.java
  - mc-mms-common
    - src
      - main
        java
        net
        maritimecloud
        internal
        mms
        messages
        Close.java
        Connected.java
        Hello.java
        PositionReport.java
        Welcome.java
        services
        AbstractClients.java
        AbstractServices.java
        ClientInfo.java
        ClientList.java
        Clients.java
        Services.java
        spi
        MmsMessage.java
        MmsMessageType.java
        transport
        AccessLogManager.java
        net
        endpoint
        EndpointManager.java
        EndpointMirror.java
        messages
        Broadcast.java
        BroadcastAck.java
        BroadcastTarget.java
        MessageHasher.java
        MethodInvoke.java
        MethodInvokeFailure.java
        MethodInvokeResult.java
        util
        DefaultAcknowledgement.java
        DefaultDispatchedMessage.java
        DefaultEndpointInvocationFuture.java
        DefaultMessageHeader.java
        util
        Coverage.java
        MessageStore.java
        StoredMessage.java
        concurrent
        CompletableFuture.java
        CompletionStage.java
        ConcurrentWeakHashSet.java
        CustomConcurrentHashMap.java
  - mc-mms-server
    - src
      - main
        java
        net
        maritimecloud
        mms
        server
        Main.java
        MmsServer.java
        MmsServerConfiguration.java
        MmsServerConnectionBus.java
        ServerEventListener.java
        WebServer.java
        broadcast
        BroadcastListenSubscription.java
        BroadcastSubscriptionSet.java
        ServerBroadcastManager.java
        connection
        client
        Client.java
        ClientInternalState.java
        ClientManager.java
        ClientProperties.java
        ClientReaper.java
        DefaultTransportListener.java
        Session.java
        SessionMessageFuture.java
        transport
        ServerTransport.java
        ServerTransportJsr356Endpoint.java
        ServerTransportListener.java
        endpoints
        ServerClientEndpointManager.java
        ServerEndpointManager.java
        ServerServices.java
        rest
        ClientManagerStatistics.java
        ClientResource.java
        DmaExceptionMapper.java
        EndpointInvoke.java
        JSONMessageBodyWriter.java
        JSONMetricRegistryBodyWriter.java
        MetricsResource.java
        ProtectedResource.java
        TailLogger.java
        TailTargetLog.java
        security
        AuthenticationException.java
        AuthenticationHandler.java
        AuthenticationToken.java
        AuthenticationTokenHandler.java
        BaseSecurityHandler.java
        ClientVerificationException.java
        ClientVerificationHandler.java
        MmsSecurityManager.java
        SslHandler.java
        Subject.java
        impl
        ApacheConfSecurityHandler.java
        BasicAuthAuthenticationTokenHandler.java
        ClientCertAuthenticationTokenHandler.java
        DefaultSslHandler.java
        FixedConfSecurityHandler.java
        JwtAuthenticationTokenHandler.java
        LdapSecurityHandler.java
        UsernamePasswordToken.java
        tracker
        PositionTracker.java
        PositionUpdatedHandler.java
        Subscription.java
      - test
        java
        net
        maritimecloud
        server
        AbstractServerConnectionTest.java
        BroadcastSender.java
        TesstEndpoint.java
        broadcast
        BroadcastReceiverAck.java
        BroadcastTest.java
        connection
        CloseTest.java
        Connect2Test.java
        ConnectTest.java
        IdGenerationTest.java
        ReconnectTest.java
        Test1000.java
        endpoint
        EndpointTest.java
        security
        ApacheSecurityTest.java
        AuthenticationTokenTest.java
  - mc-mms-tck
    - src
      - main
        java
        net
        maritimecloud
        mms
        evil
        PingPongTest.java
        Tester.java
        tck
        stubs
        AbstractTestEndpoint.java
        GenerateTestClasses.java
        TestEndpoint.java
        tests
        AbstractNetworkTest.java
        ConnectionStateListenerTest.java
        ConnectionTest.java
        NetworkFuturesOnCloseTest.java
        ProperDisconnectTest.java
        ReconnectTest.java
        SameIDConnectTest.java
        broadcast
        BroadcastTest.java
        server
        CustomPortTest.java
        StartStopServerTest.java
        service
        AbstractServiceTest.java
        ServiceFindTest.java
        ServiceTest.java
        test
        util
        ProxyTester.java
        SocketProxy.java
      - test
        java
        net
        maritimecloud
        mms
        tests
        endpoint
        EndpointTest.java
        InvokeRemoteEndpointMethodTest.java
- mc-msdl
  - mc-msdl-core
    - src
      - main
        java
        net
        maritimecloud
        internal
        msdl
        db
        DefaultMsdlDatabase.java
        Directory.java
        MsdlDatabaseConfiguration.java
        TestIt.java
        Visitor.java
        dynamic
        AbstractAsynchronousDynamicEndpointImplementation.java
        AbstractDynamicEndpointImplementation.java
        DynamicBroadcastMessage.java
        DynamicEnum.java
        DynamicMessage.java
        parser
        AbstractContainer.java
        AbstractFieldOrArgument.java
        AnnotationContainer.java
        Checks.java
        ImportResolver.java
        MsdlComment.java
        ParsedBroadcastMessage.java
        ParsedEndpoint.java
        ParsedEndpointFunction.java
        ParsedEndpointFunctionArgument.java
        ParsedEnum.java
        ParsedField.java
        ParsedMessage.java
        ParsedMsdlFile.java
        ParsedProject.java
        ParsedType.java
        SourceTagHolder.java
        TypeResolver.java
        antlr
        AntlrFile.java
        ReservedWords.java
        StringUtil.java
        generated
        MsdlLexer.java
        MsdlParser.java
        old
        DefaultSourceToken.java
        ParserLogger.java
        msdl
        MsdlLogger.java
        MsdlPlugin.java
        MsdlPluginException.java
        MsdlProcessor.java
        MsdlProcessorResult.java
        model
        Annotatable.java
        BaseMessage.java
        BaseType.java
        BroadcastMessageDeclaration.java
        CommentDeclaration.java
        EndpointDefinition.java
        EndpointMethod.java
        EnumDeclaration.java
        FieldOrParameter.java
        ListOrSetType.java
        MapType.java
        MessageDeclaration.java
        MsdlFile.java
        Project.java
        SourceToken.java
        Type.java
        package-info.java
        package-info.java
      - test
        java
        net
        maritimecloud
        msdl
        parser
        AbstractParserTest.java
        BuildinTypes.java
        EnumParserTest.java
        ImportTest.java
        MessageExceptionsTest.java
        MessageParserTest.java
        TestFs.java
        TestLogger.java
  - mc-msdl-javagenerator
    - src
      - main
        java
        net
        maritimecloud
        msdl
        plugins
        javagen
        JavaGenBroadcastMessageGenerator.java
        JavaGenEndpointGenerator.java
        JavaGenEnumGenerator.java
        JavaGenMessageGenerator.java
        JavaGenMessageImmutableGenerator.java
        JavaGenPlugin.java
        JavaGenType.java
        annotation
        JavaImplementation.java
        JavaImplements.java
        rest
        GET.java
  - mc-msdl-maven-plugin
    - src
      - main
        java
        net
        maritimecloud
        internal
        msdl
        compiler
        mavenplugin
        AbstractMsdlMojo.java
        AdaptedMsdlLogger.java
        FileTools.java
        MsdlGeneratorMojo.java
  - mc-msdl-testproject
    - src
      - test
        java
        net
        maritimecloud
        msdl
        testproject
        B1Test.java
        GeometryTest.java

/* Copyright (c) 2011 Danish Maritime Authority.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

// Protocol Buffers - Google's data interchange format
// Copyright 2008 Google Inc.  All rights reserved.
// http://code.google.com/p/protobuf/
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

package net.maritimecloud.util;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertSame;
import static org.junit.Assert.assertTrue;
import static org.junit.Assert.fail;

import java.io.UnsupportedEncodingException;
import java.nio.ByteBuffer;
import java.nio.CharBuffer;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.CharsetEncoder;
import java.nio.charset.CoderResult;
import java.nio.charset.CodingErrorAction;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import java.util.Random;
import java.util.logging.Logger;

/**
 * Shared testing code for {@link IsValidUtf8Test}.
 *
 * @author jonp@google.com (Jon Perlow)
 * @author martinrb@google.com (Martin Buchholz)
 */
// CHECKSTYLE:OFF
class IsValidUtf8TestUtil {
    private static final Logger logger = Logger.getLogger(IsValidUtf8TestUtil.class.getName());

    /** UTF-8 charset, resolved once instead of by name on every iteration of the exhaustive loops below. */
    private static final Charset UTF_8 = Charset.forName("UTF-8");

    // 128 - [chars 0x0000 to 0x007f]
    static final long ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS = 0x007f - 0x0000 + 1;

    // 128
    static final long EXPECTED_ONE_BYTE_ROUNDTRIPPABLE_COUNT = ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS;

    // 1920 [chars 0x0080 to 0x07FF]
    static final long TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS = 0x07FF - 0x0080 + 1;

    // 18,304
    static final long EXPECTED_TWO_BYTE_ROUNDTRIPPABLE_COUNT =
            // Both bytes are one byte characters
            (long) Math.pow(EXPECTED_ONE_BYTE_ROUNDTRIPPABLE_COUNT, 2) +
            // The possible number of two byte characters
            TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS;

    // 2048
    static final long THREE_BYTE_SURROGATES = 2 * 1024;

    // 61,440 [chars 0x0800 to 0xFFFF, minus surrogates]
    static final long THREE_BYTE_ROUNDTRIPPABLE_CHARACTERS = 0xFFFF - 0x0800 + 1 - THREE_BYTE_SURROGATES;

    // 2,650,112
    static final long EXPECTED_THREE_BYTE_ROUNDTRIPPABLE_COUNT =
            // All one byte characters
            (long) Math.pow(EXPECTED_ONE_BYTE_ROUNDTRIPPABLE_COUNT, 3) +
            // One two byte character and a one byte character
            2 * TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS * ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS +
            // Three byte characters
            THREE_BYTE_ROUNDTRIPPABLE_CHARACTERS;

    // 1,048,576 [chars 0x10000L to 0x10FFFF]
    static final long FOUR_BYTE_ROUNDTRIPPABLE_CHARACTERS = 0x10FFFF - 0x10000L + 1;

    // 383,270,912 (268,435,456 + 15,728,640 + 3,686,400 + 94,371,840 + 1,048,576);
    // this is also the sum of the per-shard expectations built below.
    static final long EXPECTED_FOUR_BYTE_ROUNDTRIPPABLE_COUNT =
            // All one byte characters
            (long) Math.pow(EXPECTED_ONE_BYTE_ROUNDTRIPPABLE_COUNT, 4)
            +
            // One and three byte characters
            2 * THREE_BYTE_ROUNDTRIPPABLE_CHARACTERS * ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS
            +
            // Two two byte characters
            TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS * TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS
            +
            // Permutations of one and two byte characters
            3 * TWO_BYTE_ROUNDTRIPPABLE_CHARACTERS * ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS
            * ONE_BYTE_ROUNDTRIPPABLE_CHARACTERS +
            // Four byte characters
            FOUR_BYTE_ROUNDTRIPPABLE_CHARACTERS;

    /**
     * Expected number of round-trippable four-byte sequences for each of the 128 shards, indexed by shard number.
     * (The field name keeps its historical spelling so that existing references continue to resolve.)
     */
    static final long[] FOUR_BYTE_SHARDS_EXPECTED_ROUNTRIPPABLES = generateFourByteShardsExpectedRoundtrippables();

    /**
     * Builds the table of expected round-trippable counts, one entry per shard.
     *
     * @return a 128-element array; entries that are not explicitly assigned keep the default value 0
     */
    private static long[] generateFourByteShardsExpectedRoundtrippables() {
        long[] expected = new long[128];

        // 0-63 are all 5300224
        for (int i = 0; i <= 63; i++) {
            expected[i] = 5300224;
        }

        // 97-111 are all 2342912
        for (int i = 97; i <= 111; i++) {
            expected[i] = 2342912;
        }

        // 113-117 are all 1048576
        for (int i = 113; i <= 117; i++) {
            expected[i] = 1048576;
        }

        // One offs
        expected[112] = 786432;
        expected[118] = 786432;
        expected[119] = 1048576;
        expected[120] = 458752;
        expected[121] = 524288;
        expected[122] = 65536;

        // Anything not assigned was the default 0.
        return expected;
    }

    /** The four-byte value space (2^32 values) split into 128 equally sized, consecutive shards. */
    static final List<Shard> FOUR_BYTE_SHARDS = generateFourByteShards(128, FOUR_BYTE_SHARDS_EXPECTED_ROUNTRIPPABLES);


    /**
     * Splits the range [0, 2^32) into {@code numShards} consecutive shards of equal size.
     *
     * @param numShards
     *            the number of shards; must divide 2^32 evenly and equal {@code expected.length}
     * @param expected
     *            the expected round-trippable count for each shard, indexed by shard number
     * @return the shards in ascending order of their start value
     */
    private static List<Shard> generateFourByteShards(int numShards, long[] expected) {
        assertEquals(numShards, expected.length);
        List<Shard> shards = new ArrayList<>(numShards);
        long limit = 1L << 32;
        long increment = limit / numShards;
        assertTrue(limit % numShards == 0);
        for (int i = 0; i < numShards; i++) {
            shards.add(new Shard(i, increment * i, increment * (i + 1), expected[i]));
        }
        return shards;
    }

    /**
     * Helper to run the loop to test all the permutations for the number of bytes specified.
     *
     * @param numBytes
     *            the number of bytes in the byte array
     * @param expectedCount
     *            the expected number of roundtrippable permutations
     * @throws UnsupportedEncodingException
     *             no longer thrown by this implementation; still declared so existing callers compile unchanged
     */
    static void testBytes(int numBytes, long expectedCount) throws UnsupportedEncodingException {
        testBytes(numBytes, expectedCount, 0, -1);
    }

    /**
     * Helper to run the loop to test all the permutations for the number of bytes specified. This overload is useful
     * for debugging to get the loop to start at a certain character.
     * <p>
     * For every candidate byte sequence the result of {@code Binary.isValidUtf8()} is compared against an actual
     * decode/re-encode round trip through {@link String}, against the static {@code Utf8} methods, and against
     * validation performed in three randomly sized pieces (both on the raw array and on rope-structured
     * {@code Binary} instances).
     *
     * @param numBytes
     *            the number of bytes in the byte array
     * @param expectedCount
     *            the expected number of roundtrippable permutations
     * @param start
     *            the starting bytes encoded as a long as big-endian
     * @param lim
     *            the limit of bytes to process encoded as a long as big-endian, or -1 to mean the max limit for
     *            numBytes
     * @throws UnsupportedEncodingException
     *             no longer thrown by this implementation; still declared so existing callers compile unchanged
     */
    static void testBytes(int numBytes, long expectedCount, long start, long lim) throws UnsupportedEncodingException {
        Random rnd = new Random();
        byte[] bytes = new byte[numBytes];

        if (lim == -1) {
            lim = 1L << (numBytes * 8);
        }
        long count = 0;
        long countRoundTripped = 0;
        for (long byteChar = start; byteChar < lim; byteChar++) {
            putBigEndian(bytes, byteChar);

            Binary bs = Binary.copyFrom(bytes);
            boolean isRoundTrippable = bs.isValidUtf8();
            // Decoding with a Charset replaces malformed input, so invalid sequences re-encode to different bytes.
            String s = new String(bytes, UTF_8);
            byte[] bytesReencoded = s.getBytes(UTF_8);
            boolean bytesEqual = Arrays.equals(bytes, bytesReencoded);

            if (bytesEqual != isRoundTrippable) {
                outputFailure(byteChar, bytes, bytesReencoded);
            }

            // Check agreement with static Utf8 methods.
            assertEquals(isRoundTrippable, Utf8.isValidUtf8(bytes));
            assertEquals(isRoundTrippable, Utf8.isValidUtf8(bytes, 0, numBytes));

            // Test partial sequences.
            // Partition numBytes into three segments (not necessarily non-empty).
            int i = rnd.nextInt(numBytes);
            int j = rnd.nextInt(numBytes);
            if (j < i) {
                int tmp = i;
                i = j;
                j = tmp;
            }
            int state1 = Utf8.partialIsValidUtf8(Utf8.COMPLETE, bytes, 0, i);
            int state2 = Utf8.partialIsValidUtf8(state1, bytes, i, j);
            int state3 = Utf8.partialIsValidUtf8(state2, bytes, j, numBytes);
            if (isRoundTrippable != (state3 == Utf8.COMPLETE)) {
                System.out.printf("state=%04x %04x %04x i=%d j=%d%n", state1, state2, state3, i, j);
                outputFailure(byteChar, bytes, bytesReencoded);
            }
            assertEquals(isRoundTrippable, state3 == Utf8.COMPLETE);

            // Test ropes built out of small partial sequences
            Binary rope = RopeBinary.newInstanceForTest(bs.substring(0, i),
                    RopeBinary.newInstanceForTest(bs.substring(i, j), bs.substring(j, numBytes)));
            assertSame(RopeBinary.class, rope.getClass());

            Binary[] byteStrings = { bs, bs.substring(0, numBytes), rope };
            for (Binary x : byteStrings) {
                assertEquals(isRoundTrippable, x.isValidUtf8());
                assertEquals(state3, x.partialIsValidUtf8(Utf8.COMPLETE, 0, numBytes));

                assertEquals(state1, x.partialIsValidUtf8(Utf8.COMPLETE, 0, i));
                assertEquals(state1, x.substring(0, i).partialIsValidUtf8(Utf8.COMPLETE, 0, i));
                assertEquals(state2, x.partialIsValidUtf8(state1, i, j - i));
                assertEquals(state2, x.substring(i, j).partialIsValidUtf8(state1, 0, j - i));
                assertEquals(state3, x.partialIsValidUtf8(state2, j, numBytes - j));
                assertEquals(state3, x.substring(j, numBytes).partialIsValidUtf8(state2, 0, numBytes - j));
            }

            // ByteString reduplication should not affect its UTF-8 validity.
            Binary ropeADope = RopeBinary.newInstanceForTest(bs, bs.substring(0, numBytes));
            assertEquals(isRoundTrippable, ropeADope.isValidUtf8());

            if (isRoundTrippable) {
                countRoundTripped++;
            }
            count++;
            if (byteChar != 0 && byteChar % 1000000L == 0) {
                logger.info("Processed " + byteChar / 1000000L + " million characters");
            }
        }
        logger.info("Round tripped " + countRoundTripped + " of " + count);
        assertEquals(expectedCount, countRoundTripped);
    }

    /**
     * Variation of {@link #testBytes} that does less allocation using the low-level encoders/decoders directly. Checked
     * in because it's useful for debugging when trying to process bytes faster, but since it doesn't use the actual
     * String class, it's possible for incompatibilities to develop (although unlikely).
     * <p>
     * This remains an instance method, although it reads no instance state, so that existing callers are unaffected.
     *
     * @param numBytes
     *            the number of bytes in the byte array
     * @param expectedCount
     *            the expected number of roundtrippable permutations
     * @param start
     *            the starting bytes encoded as a long as big-endian
     * @param lim
     *            the limit of bytes to process encoded as a long as big-endian, or -1 to mean the max limit for
     *            numBytes
     */
    void testBytesUsingByteBuffers(int numBytes, long expectedCount, long start, long lim) {
        CharsetDecoder decoder = UTF_8.newDecoder().onMalformedInput(CodingErrorAction.REPLACE)
                .onUnmappableCharacter(CodingErrorAction.REPLACE);
        CharsetEncoder encoder = UTF_8.newEncoder().onMalformedInput(CodingErrorAction.REPLACE)
                .onUnmappableCharacter(CodingErrorAction.REPLACE);
        byte[] bytes = new byte[numBytes];
        // Size the scratch buffers for the worst case, so they can be reused for every candidate sequence.
        int maxChars = (int) (decoder.maxCharsPerByte() * numBytes) + 1;
        char[] charsDecoded = new char[maxChars];
        int maxBytes = (int) (encoder.maxBytesPerChar() * maxChars) + 1;
        byte[] bytesReencoded = new byte[maxBytes];

        // The buffers wrap the arrays above, so writing into the arrays changes what the buffers see.
        ByteBuffer bb = ByteBuffer.wrap(bytes);
        CharBuffer cb = CharBuffer.wrap(charsDecoded);
        ByteBuffer bbReencoded = ByteBuffer.wrap(bytesReencoded);
        if (lim == -1) {
            lim = 1L << (numBytes * 8);
        }
        long count = 0;
        long countRoundTripped = 0;
        for (long byteChar = start; byteChar < lim; byteChar++) {
            // Reset all buffers and coders to their initial state before each candidate.
            bb.rewind();
            bb.limit(bytes.length);
            cb.rewind();
            cb.limit(charsDecoded.length);
            bbReencoded.rewind();
            bbReencoded.limit(bytesReencoded.length);
            encoder.reset();
            decoder.reset();
            putBigEndian(bytes, byteChar);

            boolean isRoundTrippable = Binary.copyFrom(bytes).isValidUtf8();
            CoderResult result = decoder.decode(bb, cb, true);
            assertFalse(result.isError());
            result = decoder.flush(cb);
            assertFalse(result.isError());

            // Re-encode exactly the characters that were produced by the decode step.
            int charLen = cb.position();
            cb.rewind();
            cb.limit(charLen);
            result = encoder.encode(cb, bbReencoded, true);
            assertFalse(result.isError());
            result = encoder.flush(bbReencoded);
            assertFalse(result.isError());

            // Only the first bytesLen bytes of bytesReencoded are meaningful; the array is oversized.
            boolean bytesEqual = true;
            int bytesLen = bbReencoded.position();
            if (bytesLen != numBytes) {
                bytesEqual = false;
            } else {
                for (int i = 0; i < numBytes; i++) {
                    if (bytes[i] != bytesReencoded[i]) {
                        bytesEqual = false;
                        break;
                    }
                }
            }
            if (bytesEqual != isRoundTrippable) {
                outputFailure(byteChar, bytes, bytesReencoded, bytesLen);
            }

            count++;
            if (isRoundTrippable) {
                countRoundTripped++;
            }
            if (byteChar != 0 && byteChar % 1000000 == 0) {
                logger.info("Processed " + byteChar / 1000000 + " million characters");
            }
        }
        logger.info("Round tripped " + countRoundTripped + " of " + count);
        assertEquals(expectedCount, countRoundTripped);
    }

    /**
     * Writes the low-order {@code bytes.length} bytes of {@code value} into {@code bytes} in big-endian order, i.e.
     * the least significant byte ends up in the last array element.
     */
    private static void putBigEndian(byte[] bytes, long value) {
        for (int i = bytes.length - 1; i >= 0; i--) {
            bytes[i] = (byte) value;
            value = value >> 8;
        }
    }

    /** Fails the test, reporting the candidate value, its bytes and the complete re-encoded array. */
    private static void outputFailure(long byteChar, byte[] bytes, byte[] after) {
        outputFailure(byteChar, bytes, after, after.length);
    }

    /** Fails the test, reporting the candidate value, its bytes and the first {@code len} re-encoded bytes. */
    private static void outputFailure(long byteChar, byte[] bytes, byte[] after, int len) {
        fail("Failure: (" + Long.toHexString(byteChar) + ") " + toHexString(bytes) + " => " + toHexString(after, len));
    }

    /** Formats the whole array as a quoted, space-separated list of two-digit hex values. */
    private static String toHexString(byte[] b) {
        return toHexString(b, b.length);
    }

    /** Formats the first {@code len} bytes of {@code b} as a quoted, space-separated list of two-digit hex values. */
    private static String toHexString(byte[] b, int len) {
        StringBuilder s = new StringBuilder();
        s.append("\"");
        for (int i = 0; i < len; i++) {
            if (i > 0) {
                s.append(" ");
            }
            // Mask to avoid sign extension so that each byte prints as exactly two hex digits.
            s.append(String.format("%02x", b[i] & 0xFF));
        }
        s.append("\"");
        return s.toString();
    }


    /** One slice of the four-byte value space together with its expected round-trippable count. */
    static class Shard {
        /** The shard number. */
        final long index;

        /** The first value of the shard's range. */
        final long start;

        /** The limit of the shard's range; {@code generateFourByteShards} sets it to the next shard's start. */
        final long lim;

        /** The expected number of round-trippable sequences within this shard. */
        final long expected;


        /**
         * Creates a shard; asserts that {@code start < lim}.
         */
        public Shard(long index, long start, long lim, long expected) {
            assertTrue(start < lim);
            this.index = index;
            this.start = start;
            this.lim = lim;
            this.expected = expected;
        }
    }

}
// CHECKSTYLE:ON