CSVFormat.java example

Explorer

motherbrain-master
- src
  - com
    - zillabyte
      - motherbrain
        api
        APIException.java
        APIService.java
        LocalAPIService.java
        RelationsHelper.java
        RestAPIHelper.java
        benchmarking
        Benchmark.java
        BenchmarkFactory.java
        GraphiteBenchmarker.java
        MovingBenchmarker.java
        NoopBenchmarker.java
        StderrBenchmarker.java
        container
        Container.java
        ContainerCacher.java
        ContainerEnvironmentHelper.java
        ContainerException.java
        ContainerExecuteBuilder.java
        ContainerFactory.java
        ContainerPathHelper.java
        ContainerSerializer.java
        ContainerWrapper.java
        NoopRemoteContainerCleaner.java
        PipeGateway.java
        RemoteContainerCleaner.java
        TcpSocketHelper.java
        UnixSocketHelper.java
        local
        InplaceContainer.java
        InplaceContainerFactory.java
        InplaceSerializer.java
        coordination
        AskHandler.java
        AskWrapper.java
        CoordinationException.java
        CoordinationService.java
        CoordinationServiceWrapper.java
        Lock.java
        MessageHandler.java
        RemoteCoordinationException.java
        Watcher.java
        mock
        MockStateService.java
        redis
        RedisException.java
        TransactionalMessageWrapper.java
        flow
        ActionTimeoutException.java
        App.java
        Component.java
        EndCyclePolicy.java
        Fields.java
        Flow.java
        FlowCompilationException.java
        FlowException.java
        FlowInstance.java
        FlowInstanceSetBuilder.java
        FlowInstanceWrapper.java
        FlowOperationInstance.java
        FlowOperationInstanceCollection.java
        FlowRecoveryException.java
        FlowService.java
        FlowState.java
        FlowStateCoordinator.java
        FlowStateException.java
        MapTuple.java
        StateMachine.java
        StateMachineException.java
        StateMachineHelper.java
        StreamBuilder.java
        aggregation
        AggregationException.java
        AggregationKey.java
        AggregationStore.java
        AggregationStoreFactory.java
        AggregationStoreWrapper.java
        Aggregator.java
        CachedStore.java
        CachedStoreFactory.java
        DefaultAggregationStoreFactory.java
        DiskBackedStore.java
        FlowAggregationSplitter.java
        MemoryStore.java
        MemoryStoreFactory.java
        PartialAggregator.java
        StoreType.java
        TuplePage.java
        buffer
        BufferClientFactory.java
        BufferConsumer.java
        BufferFlusher.java
        BufferProducer.java
        BufferService.java
        SinkToBuffer.java
        SourceFromBuffer.java
        mock
        LocalBufferClientFactory.java
        LocalBufferConsumer.java
        LocalBufferProducer.java
        LocalDevBufferClientFactory.java
        LocalDevBufferFlusher.java
        LocalDevBufferProducer.java
        MockBufferProducer.java
        MockBufferService.java
        collectors
        OutputCollector.java
        coordinated
        AckTuple.java
        BaseCoordTuple.java
        BatchCompleteAckTuple.java
        BatchCompleteTuple.java
        BatchState.java
        BatchTracker.java
        BatchedTuple.java
        CoordTupleOptions.java
        CoordinatedOutputCollector.java
        DeadNodeDetectedException.java
        ExplicitAckRequestTuple.java
        MaxIterationsExceededException.java
        ObserveIncomingTupleAction.java
        PingTuple.java
        PongTuple.java
        QueuedTuple.java
        support
        CoordinatedOutputCollectorSupportFactory.java
        EmptyTupleIdSet.java
        FailedTupleHandler.java
        TupleIdGenerator.java
        TupleIdMapper.java
        TupleIdSet.java
        naive
        DoNothingFailedTupleHandler.java
        NaiveCoordinatedOutputCollectorSupportFactory.java
        SerialTupleIdGenerator.java
        UncompressedTupleIdMapper.java
        UncompressedTupleIdSet.java
        components
        ComponentInput.java
        ComponentOutput.java
        builtin
        BuiltinComponents.java
        FetchUrlComponent.java
        config
        FlowConfig.java
        OperationConfig.java
        UserConfig.java
        error
        strategies
        ErrorStrategyFactory.java
        ErrorThresholdExceededException.java
        FakeLocalException.java
        FlowErrorStrategy.java
        ForgivingFlowErrorStrategy.java
        OperationErrorStrategy.java
        PassiveWorkerPercentageAndAbsoluteOperationErrorStrategy.java
        StrictFlowErrorStrategy.java
        WorkerThrowsErrorPercentageAndAbsoluteOperationErrorStrategy.java
        graph
        Connection.java
        FlowGraph.java
        heartbeats
        Heartbeat.java
        HeartbeatException.java
        local
        LocalFlowController.java
        LocalFlowOutputCollector.java
        LocalFlowService.java
        LocalOperationSlot.java
        operations
        AggregationOperation.java
        AggregationState.java
        Function.java
        FunctionState.java
        GroupBy.java
        Join.java
        JoinType.java
        MockOperationLogger.java
        Operation.java
        OperationDeadException.java
        OperationException.java
        OperationLogger.java
        OperationLoggerException.java
        OperationMessage.java
        OperationSleeper.java
        ProcessableOperation.java
        Sink.java
        SinkState.java
        Source.java
        SourceState.java
        builtin
        Clumper.java
        Count.java
        RateLimiter.java
        Unique.java
        decorators
        EmitDecorator.java
        RemoveFields.java
        RenameFields.java
        RetainFields.java
        multilang
        MultiLangCleaner.java
        MultiLangErrorHandler.java
        MultiLangException.java
        MultiLangLogHandler.java
        MultiLangMessageHandler.java
        MultiLangProcess.java
        MultiLangProcessDiedUnexpectedlyException.java
        MultiLangProcessException.java
        MultiLangProcessGeneralOperationObserver.java
        MultiLangProcessStartupLogObserver.java
        MultiLangProcessTupleObserver.java
        builder
        APIFlowBuilder.java
        APIFlowBuilderFactory.java
        FlowBuilderFactory.java
        FlowFetcher.java
        FlowValidator.java
        InplaceFlowBuilder.java
        InplaceFlowBuilderFactory.java
        MultilangFlowCompiler.java
        PlaceHolderOperation.java
        RouteBy.java
        operations
        LocalComponent.java
        MultiLangAggregator.java
        MultiLangOperation.java
        MultiLangRunEach.java
        MultiLangRunSource.java
        MultilangClumper.java
        MultilangHandler.java
        rpc
        RPCHelper.java
        RPCRequest.java
        RPCResponse.java
        RPCSink.java
        RPCSource.java
        queues
        InputQueue.java
        MockQueueFactory.java
        OutputQueue.java
        QueueFactory.java
        sourcefromrelation
        ShardReader.java
        ShardType.java
        tests
        helpers
        MockInstanceHelper.java
        metrics
        Metrics.java
        MockMetrics.java
        reactor
        lightweight
        ProcessTimeoutException.java
        relational
        APIRelationDefFactory.java
        AliasedQuery.java
        BufferQuery.java
        ColumnDef.java
        DataType.java
        DefaultStreamException.java
        MissingFieldException.java
        Query.java
        RelationBackend.java
        RelationDef.java
        RelationDefFactory.java
        RelationException.java
        S3OnlyQuery.java
        StreamMarker.java
        StreamReader.java
        UnexpectedFieldException.java
        naivepostgresimpl
        NaivePostgresStreamMarker.java
        redshiftimpl
        RedshiftStreamMarker.java
        RedshiftStreamReader.java
        shell
        LocalOsxShellFactory.java
        MachineType.java
        ShellFactory.java
        UbuntuEc2ShellFactory.java
        UbuntuTeamCityShellFactory.java
        UbuntuVagrantShellFactory.java
        state
        package-info.java
        top
        BasicTopService.java
        CommandLine.java
        LocalCommandLineHelper.java
        LocalServiceMain.java
        MotherbrainException.java
        MotherbrainRuntimeException.java
        TopService.java
        universe
        Config.java
        Environment.java
        ExceptionHandler.java
        ExpectedConfigNotPresent.java
        FileFactory.java
        FileFactoryException.java
        LocalUniverseBuilder.java
        LoggerFactory.java
        MockConfig.java
        S3Exception.java
        SSHException.java
        SSHFactory.java
        Universe.java
        UniverseBuilder.java
        utils
        ByteArrayWrapper.java
        CompressUtils.java
        DateHelper.java
        ExceptionAttempt.java
        FileLockUtil.java
        Glob.java
        JSONUtil.java
        JarCompilationException.java
        Log4jWrapper.java
        MapBuilder.java
        MeteredLog.java
        SerializableMonitor.java
        UrlHelper.java
        Utils.java
        VersionComparer.java
        backoff
        BackoffTicker.java
        ExponentialBackoffTicker.java
        csv
        Assertions.java
        CSVFormat.java
        CSVParser.java
        CSVPrinter.java
        CSVRecord.java
        Constants.java
        ExtendedBufferedReader.java
        Lexer.java
        Quote.java
        Token.java
        package-info.java
        dfs
        DFSService.java
        DFSServiceWrapper.java
        LocalDFSService.java
        queue
        ByteSizable.java

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.zillabyte.motherbrain.utils.csv;

import static com.zillabyte.motherbrain.utils.csv.Constants.BACKSLASH;
import static com.zillabyte.motherbrain.utils.csv.Constants.COMMA;
import static com.zillabyte.motherbrain.utils.csv.Constants.CR;
import static com.zillabyte.motherbrain.utils.csv.Constants.CRLF;
import static com.zillabyte.motherbrain.utils.csv.Constants.DOUBLE_QUOTE_CHAR;
import static com.zillabyte.motherbrain.utils.csv.Constants.LF;
import static com.zillabyte.motherbrain.utils.csv.Constants.TAB;

import java.io.IOException;
import java.io.Reader;
import java.io.Serializable;
import java.io.StringWriter;
import java.util.Arrays;
import java.util.HashSet;
import java.util.Set;

/**
 * Specifies the format of a CSV file and parses input.
 *
 * <h2>Using predefined formats</h2>
 *
 * <p>
 * You can use one of the predefined formats:
 * </p>
 *
 * <ul>
 *      <li>{@link #DEFAULT}</li>
 *      <li>{@link #EXCEL}</li>
 *      <li>{@link #MYSQL}</li>
 *      <li>{@link #RFC4180}</li>
 *      <li>{@link #TDF}</li>
 * </ul>
 *
 * <p>
 * For example:
 * </p>
 *
 * <pre>
 * CSVParser parser = CSVFormat.EXCEL.parse(reader);
 * </pre>
 *
 * <p>
 * The {@link CSVParser} provides static methods to parse other input types, for example:
 * </p>
 *
 * <pre>CSVParser parser = CSVParser.parse(file, StandardCharsets.US_ASCII, CSVFormat.EXCEL);</pre>
 *
 * <h2>Defining formats</h2>
 *
 * <p>
 * You can extend a format by calling the {@code with} methods. For example:
 * </p>
 *
 * <pre>
 * CSVFormat.EXCEL
 *   .withNullString("N/A")
 *   .withIgnoreSurroundingSpaces(true);
 * </pre>
 *
 * <h2>Defining column names</h2>
 *
 * <p>
 * To define the column names you want to use to access records, write:
 * </p>
 *
 * <pre>
 * CSVFormat.EXCEL.withHeader("Col1", "Col2", "Col3");
 * </pre>
 *
 * <p>
 * Calling {@link #withHeader(String...)} let's you use the given names to address values in a {@link CSVRecord}, and
 * assumes that your CSV source does not contain a first record that also defines column names.
 *
 * If it does, then you are overriding this metadata with your names and you should skip the first record by calling
 * {@link #withSkipHeaderRecord(boolean)} with {@code true}.
 * </p>
 *
 * <h2>Parsing</h2>
 *
 * <p>
 * You can use a format directly to parse a reader. For example, to parse an Excel file with columns header, write:
 * </p>
 *
 * <pre>
 * Reader in = ...;
 * CSVFormat.EXCEL.withHeader("Col1", "Col2", "Col3").parse(in);
 * </pre>
 *
 * <p>
 * For other input types, like resources, files, and URLs, use the static methods on {@link CSVParser}.
 * </p>
 *
 * <h2>Referencing columns safely</h2>
 *
 * <p>
 * If your source contains a header record, you can simplify your code and safely reference columns,
 * by using {@link #withHeader(String...)} with no arguments:
 * </p>
 *
 * <pre>
 * CSVFormat.EXCEL.withHeader();
 * </pre>
 *
 * <p>
 * This causes the parser to read the first record and use its values as column names.
 *
 * Then, call one of the {@link CSVRecord} get method that takes a String column name argument:
 * </p>
 *
 * <pre>
 * String value = record.get("Col1");
 * </pre>
 *
 * <p>
 * This makes your code impervious to changes in column order in the CSV file.
 * </p>
 *
 * <h2>Notes</h2>
 *
 * <p>
 * This class is immutable.
 * </p>
 *
 * @version $Id: CSVFormat.java 1610494 2014-07-14 19:34:56Z britter $
 */
public final class CSVFormat implements Serializable {

    private static final long serialVersionUID = 1L;

    private final char delimiter;
    private final Character quoteChar; // null if quoting is disabled
    private final Quote quotePolicy;
    private final Character commentStart; // null if commenting is disabled
    private final Character escape; // null if escaping is disabled
    private final boolean ignoreSurroundingSpaces; // Should leading/trailing spaces be ignored around values?
    private final boolean ignoreEmptyHeaders;
    private final boolean ignoreEmptyLines;
    private final String recordSeparator; // for outputs
    private final String nullString; // the string to be used for null values
    private final String[] header; // array of header column names
    private final boolean skipHeaderRecord;

    /**
     * Standard comma separated format, as for {@link #RFC4180} but allowing empty lines.
     *
     * <p>Settings are:
     * <ul>
     *   <li>withDelimiter(',')</li>
     *   <li>withQuoteChar('"')</li>
     *   <li>withRecordSeparator("\r\n")</li>
     *   <li>withIgnoreEmptyLines(true)</li>
     * </ul>
     * </p>
     */
    public static final CSVFormat DEFAULT = new CSVFormat(COMMA, DOUBLE_QUOTE_CHAR, null, null, null,
                                                            false, true, CRLF, null, null, false, false);

    /**
     * Comma separated format as defined by <a href="http://tools.ietf.org/html/rfc4180">RFC 4180</a>.
     *
     * <p>Settings are:
     * <ul>
     *   <li>withDelimiter(',')</li>
     *   <li>withQuoteChar('"')</li>
     *   <li>withRecordSeparator("\r\n")</li>
     *   <li>withIgnoreEmptyLines(false)</li>
     * </ul>
     * </p>
     */
    public static final CSVFormat RFC4180 = DEFAULT.withIgnoreEmptyLines(false);

    /**
     * Excel file format (using a comma as the value delimiter). Note that the actual value delimiter used by Excel is
     * locale dependent, it might be necessary to customize this format to accommodate to your regional settings.
     *
     * <p>
     * For example for parsing or generating a CSV file on a French system the following format will be used:
     * </p>
     *
     * <pre>
     * CSVFormat fmt = CSVFormat.EXCEL.withDelimiter(';');
     * </pre>
     *
     * <p>
     * Settings are:
     * <ul>
     *   <li>withDelimiter(',')</li>
     *   <li>withQuoteChar('"')</li>
     *   <li>withRecordSeparator("\r\n")</li>
     *   <li>withIgnoreEmptyLines(false)</li>
     * </ul>
     * </p>
     * <p>
     * Note: this is currently the same as {@link #RFC4180}.
     * </p>
     */
    public static final CSVFormat EXCEL = DEFAULT.withIgnoreEmptyLines(false);

    /**
     * Tab-delimited format.
     *
     * <p>Settings are:
     * <ul>
     *   <li>withDelimiter('\t')</li>
     *   <li>withQuoteChar('"')</li>
     *   <li>withRecordSeparator("\r\n")</li>
     *   <li>withIgnoreSurroundingSpaces(true)</li>
     * </ul>
     * </p>
     */
    public static final CSVFormat TDF =
            DEFAULT
            .withDelimiter(TAB)
            .withIgnoreSurroundingSpaces(true);

    /**
     * Default MySQL format used by the <tt>SELECT INTO OUTFILE</tt> and <tt>LOAD DATA INFILE</tt> operations.
     *
     * <p>
     * This is a tab-delimited format with a LF character as the line separator. Values are not quoted and special characters
     * are escaped with '\'.
     * </p>
     *
     * <p>
     * Settings are:
     * <ul>
     *   <li>withDelimiter('\t')</li>
     *   <li>withQuoteChar(null)</li>
     *   <li>withRecordSeparator('\n')</li>
     *   <li>withIgnoreEmptyLines(false)</li>
     *   <li>withEscape('\\')</li>
     * </ul>
     * </p>
     * @see <a href="http://dev.mysql.com/doc/refman/5.1/en/load-data.html">
     *      http://dev.mysql.com/doc/refman/5.1/en/load-data.html</a>
     */
    public static final CSVFormat MYSQL =
            DEFAULT
            .withDelimiter(TAB)
            .withEscape(BACKSLASH)
            .withIgnoreEmptyLines(false)
            .withQuoteChar(null)
            .withRecordSeparator(LF);

    /**
     * Returns true if the given character is a line break character.
     *
     * @param c
     *            the character to check
     *
     * @return true if <code>c</code> is a line break character
     */
    private static boolean isLineBreak(final char c) {
        return c == LF || c == CR;
    }

    /**
     * Returns true if the given character is a line break character.
     *
     * @param c
     *            the character to check, may be null
     *
     * @return true if <code>c</code> is a line break character (and not null)
     */
    private static boolean isLineBreak(final Character c) {
        return c != null && isLineBreak(c.charValue());
    }

    /**
     * Creates a new CSV format with the specified delimiter.
     *
     * <p>Use this method if you want to create a CSVFormat from scratch. All fields but the delimiter will be
     * initialized with null/false.</p>
     *
     * @param delimiter
     *            the char used for value separation, must not be a line break character
     * @return a new CSV format.
     * @throws IllegalArgumentException if the delimiter is a line break character
     *
     * @see #DEFAULT
     * @see #RFC4180
     * @see #MYSQL
     * @see #EXCEL
     * @see #TDF
     */
    public static CSVFormat newFormat(final char delimiter) {
        return new CSVFormat(delimiter, null, null, null, null, false, false, null, null, null, false, false);
    }

    /**
     * Creates a customized CSV format.
     *
     * @param delimiter
     *            the char used for value separation, must not be a line break character
     * @param quoteChar
     *            the Character used as value encapsulation marker, may be {@code null} to disable
     * @param quotePolicy
     *            the quote policy
     * @param commentStart
     *            the Character used for comment identification, may be {@code null} to disable
     * @param escape
     *            the Character used to escape special characters in values, may be {@code null} to disable
     * @param ignoreSurroundingSpaces
     *            <tt>true</tt> when whitespaces enclosing values should be ignored
     * @param ignoreEmptyLines
     *            <tt>true</tt> when the parser should skip empty lines
     * @param recordSeparator
     *            the line separator to use for output
     * @param nullString
     *            the line separator to use for output
     * @param header
     *            the header
     * @param skipHeaderRecord TODO
     * @param ignoreEmptyHeaders TODO
     * @throws IllegalArgumentException if the delimiter is a line break character
     */
    private CSVFormat(final char delimiter, final Character quoteChar,
            final Quote quotePolicy, final Character commentStart,
            final Character escape, final boolean ignoreSurroundingSpaces,
            final boolean ignoreEmptyLines, final String recordSeparator,
            final String nullString, final String[] header, final boolean skipHeaderRecord,
            final boolean ignoreEmptyHeaders) {
        if (isLineBreak(delimiter)) {
            throw new IllegalArgumentException("The delimiter cannot be a line break");
        }
        this.delimiter = delimiter;
        this.quoteChar = quoteChar;
        this.quotePolicy = quotePolicy;
        this.commentStart = commentStart;
        this.escape = escape;
        this.ignoreSurroundingSpaces = ignoreSurroundingSpaces;
        this.ignoreEmptyHeaders = ignoreEmptyHeaders;
        this.ignoreEmptyLines = ignoreEmptyLines;
        this.recordSeparator = recordSeparator;
        this.nullString = nullString;
        if (header == null) {
            this.header = null;
        } else {
            final Set<String> dupCheck = new HashSet<String>();
            for (final String hdr : header) {
                if (!dupCheck.add(hdr)) {
                    throw new IllegalArgumentException("The header contains a duplicate entry: '" + hdr + "' in " +
                            Arrays.toString(header));
                }
            }
            this.header = header.clone();
        }
        this.skipHeaderRecord = skipHeaderRecord;
        validate();
    }

    @Override
    public boolean equals(final Object obj) {
        if (this == obj) {
            return true;
        }
        if (obj == null) {
            return false;
        }
        if (getClass() != obj.getClass()) {
            return false;
        }

        final CSVFormat other = (CSVFormat) obj;
        if (delimiter != other.delimiter) {
            return false;
        }
        if (quotePolicy != other.quotePolicy) {
            return false;
        }
        if (quoteChar == null) {
            if (other.quoteChar != null) {
                return false;
            }
        } else if (!quoteChar.equals(other.quoteChar)) {
            return false;
        }
        if (commentStart == null) {
            if (other.commentStart != null) {
                return false;
            }
        } else if (!commentStart.equals(other.commentStart)) {
            return false;
        }
        if (escape == null) {
            if (other.escape != null) {
                return false;
            }
        } else if (!escape.equals(other.escape)) {
            return false;
        }
        if (nullString == null) {
            if (other.nullString != null) {
                return false;
            }
        } else if (!nullString.equals(other.nullString)) {
            return false;
        }
        if (!Arrays.equals(header, other.header)) {
            return false;
        }
        if (ignoreSurroundingSpaces != other.ignoreSurroundingSpaces) {
            return false;
        }
        if (ignoreEmptyLines != other.ignoreEmptyLines) {
            return false;
        }
        if (skipHeaderRecord != other.skipHeaderRecord) {
            return false;
        }
        if (recordSeparator == null) {
            if (other.recordSeparator != null) {
                return false;
            }
        } else if (!recordSeparator.equals(other.recordSeparator)) {
            return false;
        }
        return true;
    }

    /**
     * Formats the specified values.
     *
     * @param values
     *            the values to format
     * @return the formatted values
     */
    public String format(final Object... values) {
        final StringWriter out = new StringWriter();
        try {
            new CSVPrinter(out, this).printRecord(values);
            return out.toString().trim();
        } catch (final IOException e) {
            // should not happen because a StringWriter does not do IO.
            throw new IllegalStateException(e);
        }
    }

    /**
     * Returns the character marking the start of a line comment.
     *
     * @return the comment start marker, may be {@code null}
     */
    public Character getCommentStart() {
        return commentStart;
    }

    /**
     * Returns the character delimiting the values (typically ';', ',' or '\t').
     *
     * @return the delimiter character
     */
    public char getDelimiter() {
        return delimiter;
    }

    /**
     * Returns the escape character.
     *
     * @return the escape character, may be {@code null}
     */
    public Character getEscape() {
        return escape;
    }

    /**
     * Returns a copy of the header array.
     *
     * @return a copy of the header array; {@code null} if disabled, the empty array if to be read from the file
     */
    public String[] getHeader() {
        return header != null ? header.clone() : null;
    }

    /**
     * Specifies whether empty headers are ignored when parsing the header line.
     *
     * @return <tt>true</tt> if headers are ignored when parsing the header line, <tt>false</tt> to throw an
     *         {@link IllegalArgumentException}.
     */
    public boolean isIgnoringEmptyHeaders() {
        return ignoreEmptyHeaders;
    }

    /**
     * Specifies whether empty lines between records are ignored when parsing input.
     *
     * @return <tt>true</tt> if empty lines between records are ignored, <tt>false</tt> if they are turned into empty
     *         records.
     */
    public boolean isIgnoringEmptyLines() {
        return ignoreEmptyLines;
    }

    /**
     * Specifies whether spaces around values are ignored when parsing input.
     *
     * @return <tt>true</tt> if spaces around values are ignored, <tt>false</tt> if they are treated as part of the
     *         value.
     */
    public boolean isIgnoringSurroundingSpaces() {
        return ignoreSurroundingSpaces;
    }

    /**
     * Gets the String to convert to and from {@code null}.
     * <ul>
     * <li>
     * <strong>Reading:</strong> Converts strings equal to the given {@code nullString} to {@code null} when reading
     * records.
     * </li>
     * <li>
     * <strong>Writing:</strong> Writes {@code null} as the given {@code nullString} when writing records.</li>
     * </ul>
     *
     * @return the String to convert to and from {@code null}. No substitution occurs if {@code null}
     */
    public String getNullString() {
        return nullString;
    }

    /**
     * Returns the character used to encapsulate values containing special characters.
     *
     * @return the quoteChar character, may be {@code null}
     */
    public Character getQuoteChar() {
        return quoteChar;
    }

    /**
     * Returns the quote policy output fields.
     *
     * @return the quote policy
     */
    public Quote getQuotePolicy() {
        return quotePolicy;
    }

    /**
     * Returns the record separator delimiting output records.
     *
     * @return the record separator
     */
    public String getRecordSeparator() {
        return recordSeparator;
    }

    /**
     * Returns whether to skip the header record.
     *
     * @return whether to skip the header record.
     */
    public boolean isSkippingHeaderRecord() {
        return skipHeaderRecord;
    }

    @Override
    public int hashCode()
    {
        final int prime = 31;
        int result = 1;

        result = prime * result + delimiter;
        result = prime * result + ((quotePolicy == null) ? 0 : quotePolicy.hashCode());
        result = prime * result + ((quoteChar == null) ? 0 : quoteChar.hashCode());
        result = prime * result + ((commentStart == null) ? 0 : commentStart.hashCode());
        result = prime * result + ((escape == null) ? 0 : escape.hashCode());
        result = prime * result + ((nullString == null) ? 0 : nullString.hashCode());
        result = prime * result + (ignoreSurroundingSpaces ? 1231 : 1237);
        result = prime * result + (ignoreEmptyLines ? 1231 : 1237);
        result = prime * result + (skipHeaderRecord ? 1231 : 1237);
        result = prime * result + ((recordSeparator == null) ? 0 : recordSeparator.hashCode());
        result = prime * result + Arrays.hashCode(header);
        return result;
    }

    /**
     * Specifies whether comments are supported by this format.
     *
     * Note that the comment introducer character is only recognized at the start of a line.
     *
     * @return <tt>true</tt> is comments are supported, <tt>false</tt> otherwise
     */
    public boolean isCommentingEnabled() {
        return commentStart != null;
    }

    /**
     * Returns whether escape are being processed.
     *
     * @return {@code true} if escapes are processed
     */
    public boolean isEscaping() {
        return escape != null;
    }

    /**
     * Returns whether a nullString has been defined.
     *
     * @return {@code true} if a nullString is defined
     */
    public boolean isHandlingNull() {
        return nullString != null;
    }

    /**
     * Returns whether a quoteChar has been defined.
     *
     * @return {@code true} if a quoteChar is defined
     */
    public boolean isQuoting() {
        return quoteChar != null;
    }

    /**
     * Parses the specified content.
     *
     * <p>
     * See also the various static parse methods on {@link CSVParser}.
     * </p>
     *
     * @param in
     *            the input stream
     * @return a parser over a stream of {@link CSVRecord}s.
     * @throws IOException
     *             If an I/O error occurs
     */
    public CSVParser parse(final Reader in) throws IOException {
        return new CSVParser(in, this);
    }

    /**
     * Prints to the specified output.
     *
     * <p>
     * See also {@link CSVPrinter}.
     * </p>
     *
     * @param out
     *        the output
     * @return a printer to an output
     * @throws IOException
     *         thrown if the optional header cannot be printed.
     */
    public CSVPrinter print(final Appendable out) throws IOException {
        return new CSVPrinter(out, this);
    }

    @Override
    public String toString() {
        final StringBuilder sb = new StringBuilder();
        sb.append("Delimiter=<").append(delimiter).append('>');
        if (isEscaping()) {
            sb.append(' ');
            sb.append("Escape=<").append(escape).append('>');
        }
        if (isQuoting()) {
            sb.append(' ');
            sb.append("QuoteChar=<").append(quoteChar).append('>');
        }
        if (isCommentingEnabled()) {
            sb.append(' ');
            sb.append("CommentStart=<").append(commentStart).append('>');
        }
        if (isHandlingNull()) {
            sb.append(' ');
            sb.append("NullString=<").append(nullString).append('>');
        }
        if(recordSeparator != null) {
            sb.append(' ');
            sb.append("RecordSeparator=<").append(recordSeparator).append('>');
        }
        if (isIgnoringEmptyLines()) {
            sb.append(" EmptyLines:ignored");
        }
        if (isIgnoringSurroundingSpaces()) {
            sb.append(" SurroundingSpaces:ignored");
        }
        sb.append(" SkipHeaderRecord:").append(skipHeaderRecord);
        if (header != null) {
            sb.append(' ');
            sb.append("Header:").append(Arrays.toString(header));
        }
        return sb.toString();
    }

    /**
     * Verifies the consistency of the parameters and throws an IllegalArgumentException if necessary.
     *
     * @throws IllegalArgumentException
     */
    private void validate() throws IllegalArgumentException {
        if (quoteChar != null && delimiter == quoteChar.charValue()) {
            throw new IllegalArgumentException(
                    "The quoteChar character and the delimiter cannot be the same ('" + quoteChar + "')");
        }

        if (escape != null && delimiter == escape.charValue()) {
            throw new IllegalArgumentException(
                    "The escape character and the delimiter cannot be the same ('" + escape + "')");
        }

        if (commentStart != null && delimiter == commentStart.charValue()) {
            throw new IllegalArgumentException(
                    "The comment start character and the delimiter cannot be the same ('" + commentStart + "')");
        }

        if (quoteChar != null && quoteChar.equals(commentStart)) {
            throw new IllegalArgumentException(
                    "The comment start character and the quoteChar cannot be the same ('" + commentStart + "')");
        }

        if (escape != null && escape.equals(commentStart)) {
            throw new IllegalArgumentException(
                    "The comment start and the escape character cannot be the same ('" + commentStart + "')");
        }

        if (escape == null && quotePolicy == Quote.NONE) {
            throw new IllegalArgumentException("No quotes mode set but no escape character is set");
        }
    }

    /**
     * Sets the comment start marker of the format to the specified character.
     *
     * Note that the comment start character is only recognized at the start of a line.
     *
     * @param commentMarker
     *            the comment start marker
     * @return A new CSVFormat that is equal to this one but with the specified character as the comment start marker
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withCommentMarker(final char commentMarker) {
        return withCommentMarker(Character.valueOf(commentMarker));
    }

    /**
     * Sets the comment start marker of the format to the specified character.
     *
     * Note that the comment start character is only recognized at the start of a line.
     *
     * @param commentMarker
     *            the comment start marker, use {@code null} to disable
     * @return A new CSVFormat that is equal to this one but with the specified character as the comment start marker
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withCommentMarker(final Character commentMarker) {
        if (isLineBreak(commentMarker)) {
            throw new IllegalArgumentException("The comment start marker character cannot be a line break");
        }
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentMarker, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the delimiter of the format to the specified character.
     *
     * @param delimiter
     *            the delimiter character
     * @return A new CSVFormat that is equal to this with the specified character as delimiter
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withDelimiter(final char delimiter) {
        if (isLineBreak(delimiter)) {
            throw new IllegalArgumentException("The delimiter cannot be a line break");
        }
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the escape character of the format to the specified character.
     *
     * @param escape
     *            the escape character
     * @return A new CSVFormat that is equal to his but with the specified character as the escape character
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withEscape(final char escape) {
        return withEscape(Character.valueOf(escape));
    }

    /**
     * Sets the escape character of the format to the specified character.
     *
     * @param escape
     *            the escape character, use {@code null} to disable
     * @return A new CSVFormat that is equal to this but with the specified character as the escape character
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withEscape(final Character escape) {
        if (isLineBreak(escape)) {
            throw new IllegalArgumentException("The escape character cannot be a line break");
        }
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the header of the format. The header can either be parsed automatically from the input file with:
     *
     * <pre>
     * CSVFormat format = aformat.withHeader();</pre>
     *
     * or specified manually with:
     *
     * <pre>
     * CSVFormat format = aformat.withHeader("name", "email", "phone");</pre>
     *
     * @param header
     *            the header, <tt>null</tt> if disabled, empty if parsed automatically, user specified otherwise.
     *
     * @return A new CSVFormat that is equal to this but with the specified header
     * @see #withSkipHeaderRecord(boolean)
     */
    public CSVFormat withHeader(final String... header) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the empty header behavior of the format.
     *
     * @param ignoreEmptyHeaders
     *            the empty header behavior, <tt>true</tt> to ignore empty headers in the header line,
     *            <tt>false</tt> to cause an {@link IllegalArgumentException} to be thrown.
     * @return A new CSVFormat that is equal to this but with the specified empty header behavior.
     */
    public CSVFormat withIgnoreEmptyHeaders(final boolean ignoreEmptyHeaders) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyHeaders, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the empty line skipping behavior of the format.
     *
     * @param ignoreEmptyLines
     *            the empty line skipping behavior, <tt>true</tt> to ignore the empty lines between the records,
     *            <tt>false</tt> to translate empty lines to empty records.
     * @return A new CSVFormat that is equal to this but with the specified empty line skipping behavior.
     */
    public CSVFormat withIgnoreEmptyLines(final boolean ignoreEmptyLines) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the trimming behavior of the format.
     *
     * @param ignoreSurroundingSpaces
     *            the trimming behavior, <tt>true</tt> to remove the surrounding spaces, <tt>false</tt> to leave the
     *            spaces as is.
     * @return A new CSVFormat that is equal to this but with the specified trimming behavior.
     */
    public CSVFormat withIgnoreSurroundingSpaces(final boolean ignoreSurroundingSpaces) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Performs conversions to and from null for strings on input and output.
     * <ul>
     * <li>
     * <strong>Reading:</strong> Converts strings equal to the given {@code nullString} to {@code null} when reading
     * records.</li>
     * <li>
     * <strong>Writing:</strong> Writes {@code null} as the given {@code nullString} when writing records.</li>
     * </ul>
     *
     * @param nullString
     *            the String to convert to and from {@code null}. No substitution occurs if {@code null}
     *
     * @return A new CSVFormat that is equal to this but with the specified null conversion string.
     */
    public CSVFormat withNullString(final String nullString) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the quoteChar of the format to the specified character.
     *
     * @param quoteChar
     *            the quoteChar character
     * @return A new CSVFormat that is equal to this but with the specified character as quoteChar
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withQuoteChar(final char quoteChar) {
        return withQuoteChar(Character.valueOf(quoteChar));
    }

    /**
     * Sets the quoteChar of the format to the specified character.
     *
     * @param quoteChar
     *            the quoteChar character, use {@code null} to disable
     * @return A new CSVFormat that is equal to this but with the specified character as quoteChar
     * @throws IllegalArgumentException
     *             thrown if the specified character is a line break
     */
    public CSVFormat withQuoteChar(final Character quoteChar) {
        if (isLineBreak(quoteChar)) {
            throw new IllegalArgumentException("The quoteChar cannot be a line break");
        }
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the output quote policy of the format to the specified value.
     *
     * @param quotePolicy
     *            the quote policy to use for output.
     *
     * @return A new CSVFormat that is equal to this but with the specified quote policy
     */
    public CSVFormat withQuotePolicy(final Quote quotePolicy) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets the record separator of the format to the specified character.
     *
     * <p><strong>Note:</strong> This setting is only used during printing and does not affect parsing. Parsing currently
     * only works for inputs with '\n', '\r' and "\r\n"</p>
     *
     * @param recordSeparator
     *            the record separator to use for output.
     *
     * @return A new CSVFormat that is equal to this but with the the specified output record separator
     */
    public CSVFormat withRecordSeparator(final char recordSeparator) {
        return withRecordSeparator(String.valueOf(recordSeparator));
    }

    /**
     * Sets the record separator of the format to the specified String.
     *
     * <p><strong>Note:</strong> This setting is only used during printing and does not affect parsing. Parsing currently
     * only works for inputs with '\n', '\r' and "\r\n"</p>
     *
     * @param recordSeparator
     *            the record separator to use for output.
     *
     * @return A new CSVFormat that is equal to this but with the the specified output record separator
     * @throws IllegalArgumentException
     *              if recordSeparator is none of CR, LF or CRLF
     */
    public CSVFormat withRecordSeparator(final String recordSeparator) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }

    /**
     * Sets whether to skip the header record.
     *
     * @param skipHeaderRecord
     *            whether to skip the header record.
     *
     * @return A new CSVFormat that is equal to this but with the the specified skipHeaderRecord setting.
     * @see #withHeader(String...)
     */
    public CSVFormat withSkipHeaderRecord(final boolean skipHeaderRecord) {
        return new CSVFormat(delimiter, quoteChar, quotePolicy, commentStart, escape,
                ignoreSurroundingSpaces, ignoreEmptyLines, recordSeparator, nullString, header, skipHeaderRecord,
                ignoreEmptyHeaders);
    }
}