HttpRequestURIDecoder.java example

Explorer

Grizzly-master
- contribs
  - grizzly-httpservice
    - src
      - main
        java
        com
        sun
        grizzly
        osgi
        httpservice
        Activator.java
        HttpContextImpl.java
        HttpServiceFactory.java
        HttpServiceImpl.java
        OSGiAuthFilter.java
        OSGiCleanMapper.java
        OSGiGrizzlyAdapter.java
        OSGiMainAdapter.java
        OSGiResourceAdapter.java
        OSGiServletAdapter.java
        OSGiServletContext.java
        util
        Logger.java
      - test
        java
        com
        sun
        grizzly
        osgi
        httpservice
        OSGiCleanMapperTest.java
  - httpclient
    - src
      - main
        java
        com
        sun
        grizzly
        httpclient
        GrizzlyHttpClient.java
        HttpClientRequest.java
        HttpClientResponse.java
        HttpMethod.java
        HttpProtocolVersion.java
      - test
        java
        com
        sun
        grizzly
        httpclient
        HttpClientGetTest.java
  - httpservice-its
    - src
      - main
        java
        com
        sun
        grizzly
        osgi
        httpservice
        its
        impl
        Activator.java
        Logger.java
      - test
        java
        com
        sun
        grizzly
        osgi
        httpservice
        its
        impl
        AuthenticationTest.java
        RegisterOverlappingResourceTest.java
        RegisterSevletTest.java
        RegisterUnderUsedAliasTest.java
        ResourceAvailableTest.java
        ServletAvailableTest.java
        UnregisterNotOwnedAliasTest.java
  - jsp-support
    - src
      - test
        java
        com
        sun
        grizzly
        http
        servlet
        deployer
        WebDefaultSupportTest.java
- extras
  - cachetest
    - src
      - main
        java
        com
        sun
        grizzly
        test
        cachetest
        ConcurrentCacheTester.java
        InstanceFactory.java
        TestAndResult.java
        TestLogic.java
        testobjects
        SelectionKeyOP.java
  - cometd-client
    - src
      - main
        java
        dojox
        cometd
        Bayeux.java
        Channel.java
        Client.java
        DataFilter.java
        Extension.java
        Listener.java
        Message.java
        MessageListener.java
        RemoveListener.java
        SecurityPolicy.java
        org
        mortbay
        cometd
        client
        BayeuxClient.java
        BayeuxLoadGenerator.java
      - test
        java
        com
        sun
        grizzly
        cometd
        client
        BayeuxClientLoadTest.java
  - grizzlet
    - src
      - main
        java
        com
        sun
        grizzly
        container
        AsyncConnectionImpl.java
        GrizzletAdapter.java
        GrizzletCometHandler.java
        GrizzletRequest.java
        GrizzletResponse.java
        grizzlet
        AlreadyPausedException.java
        AsyncConnection.java
        Grizzlet.java
        NotYetPausedException.java
  - http-ajp
    - src
      - main
        java
        com
        sun
        grizzly
        http
        jk
        apr
        AprImpl.java
        common
        AjpConstants.java
        ChannelJni.java
        ChannelNioSocket.java
        ChannelShm.java
        ChannelSocket.java
        ChannelUn.java
        HandlerDispatch.java
        HandlerRequest.java
        JkInputStream.java
        JniHandler.java
        MsgAjp.java
        Shm.java
        Shm14.java
        WorkerDummy.java
        core
        JkChannel.java
        JkHandler.java
        Msg.java
        MsgContext.java
        WorkerEnv.java
        server
        JkCoyoteHandler.java
        JkMain.java
        util
        res
        StringManager.java
        threads
        ThreadPool.java
        ThreadPoolRunnable.java
        ThreadWithAttributes.java
  - hudson-on-grizzly
    - src
      - main
        java
        com
        sun
        grizzly
        hudson
        Hudson.java
  - lzma
    - src
      - main
        java
        com
        sun
        grizzly
        lzma
        CRC.java
        ICodeProgress.java
        LzmaAlone.java
        LzmaBench.java
        compression
        lz
        BinTree.java
        InWindow.java
        OutWindow.java
        lzma
        Base.java
        Decoder.java
        Encoder.java
        rangecoder
        BitTreeDecoder.java
        BitTreeEncoder.java
        Decoder.java
        Encoder.java
  - messages-bus
    - src
      - main
        java
        com
        sun
        grizzly
        messagesbus
        MessagesBus.java
        MessagesBusCometHandler.java
- modules
- samples
  - comet
    - comet-chat
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        AjaxCometServlet.java
    - comet-chat-iframe
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        iframechat
        CometServlet.java
    - comet-counter
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        LongPollingServlet.java
    - comet-hidden
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        HiddenCometServlet.java
    - comet-jmaki
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        CometServlet.java
    - cometd-javaapiupdate-chat
      - src
        main
        java
        com
        sun
        grizzly
        bayeux
        BayeuxExternalServlet.java
    - twitter
      - src
        main
        java
        com
        sun
        grizzly
        samples
        comet
        TwitterServlet.java
  - framework
    - filters-samples
      - src
        main
        java
        com
        sun
        grizzly
        filter
        BytesTrafficListener.java
        Client.java
        ClosedMessage.java
        CustomProtocolClient.java
        CustomProtocolHelper.java
        CustomProtocolParser.java
        CustomProtocolServer.java
        FragmentMessage.java
        IOExceptionHandler.java
        InputStreamMessage.java
        Message.java
        MessageBase.java
        MessageDispatcher.java
        MessageError.java
        MessageParseException.java
        ProtocolOutputStream.java
        ProxyCallbackHandler.java
        RemoteCall.java
        RemoteInputStream.java
        ReplyMessage.java
        ReplyMessageFactory.java
        RequestMessage.java
        SSLPreProcessor.java
        Server.java
        standalone
        framework
        Example_1_Client.java
        Example_1_Server.java
        Main.java
        MainSSL.java
    - nio-migration-guide
      - demo1
        src
        main
        java
        com
        sun
        grizzly
        samples
        migration
        NIOGateway.java
        QuoteManager.java
        command
        BasicCommand.java
        FeedCommand.java
        ICommand.java
        ICommandRequest.java
        QuitCommand.java
        QuoteCommand.java
        connection
        handler
        ClientConnectionHandler.java
        SocketConnectionListener.java
        ThirdPartyConnectionHandler.java
        dao
        Quote.java
        response
        FeedCommandRequest.java
        QuoteCommandRequest.java
        handler
        FeedResponseHandler.java
        IResponseHandler.java
        QuoteResponseHandler.java
      - demo2
        src
        main
        java
        com
        sun
        grizzly
        samples
        migration
        NIOGateway.java
        QuoteManager.java
        command
        BasicCommand.java
        FeedCommand.java
        ICommand.java
        ICommandRequest.java
        QuitCommand.java
        QuoteCommand.java
        connection
        handler
        ClientConnectionHandler.java
        SocketConnectionListener.java
        ThirdPartyConnectionHandler.java
        dao
        Quote.java
        response
        FeedCommandRequest.java
        QuoteCommandRequest.java
        handler
        FeedResponseHandler.java
        IResponseHandler.java
        QuoteResponseHandler.java
      - demo3
        src
        main
        java
        com
        sun
        grizzly
        samples
        migration
        GrizzlyGateway.java
        QuoteManager.java
        command
        BasicCommand.java
        FeedCommand.java
        ICommand.java
        ICommandRequest.java
        QuitCommand.java
        QuoteCommand.java
        connection
        handler
        ClientConnectionHandler.java
        GrizzlyConnectionListener.java
        ThirdPartyConnectionHandler.java
        filter
        QuoteQueryManagerFilter.java
        QuoteQueryProtocolFilter.java
        parser
        QuoteQueryProtocolParser.java
        dao
        Quote.java
        response
        FeedCommandRequest.java
        QuoteCommandRequest.java
        handler
        FeedResponseHandler.java
        IResponseHandler.java
        QuoteResponseHandler.java
  - http
    - http-embed
      - src
        main
        java
        com
        sun
        grizzly
        samples
        http
        embed
        GrizzlyEmbedWebServer.java
    - multiple-adapter
      - src
        main
        java
        com
        sun
        grizzly
        samples
        http
        adapter
        GrizzlyEmbedWebServer.java
  - websockets
    - chat
      - src
        main
        java
        com
        sun
        grizzly
        samples
        websockets
        ChatApplication.java
        ChatWebSocket.java
        WebSocketsServlet.java
        test
        java
        com
        sun
        grizzly
        websockets
        Main.java

/*
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
 *
 * Copyright (c) 2008-2010 Oracle and/or its affiliates. All rights reserved.
 *
 * The contents of this file are subject to the terms of either the GNU
 * General Public License Version 2 only ("GPL") or the Common Development
 * and Distribution License("CDDL") (collectively, the "License").  You
 * may not use this file except in compliance with the License.  You can
 * obtain a copy of the License at
 * https://glassfish.dev.java.net/public/CDDL+GPL_1_1.html
 * or packager/legal/LICENSE.txt.  See the License for the specific
 * language governing permissions and limitations under the License.
 *
 * When distributing the software, include this License Header Notice in each
 * file and include the License file at packager/legal/LICENSE.txt.
 *
 * GPL Classpath Exception:
 * Oracle designates this particular file as subject to the "Classpath"
 * exception as provided by Oracle in the GPL Version 2 section of the License
 * file that accompanied this code.
 *
 * Modifications:
 * If applicable, add the following below the License Header, with the fields
 * enclosed by brackets [] replaced by your own identifying information:
 * "Portions Copyright [year] [name of copyright owner]"
 *
 * Contributor(s):
 * If you wish your version of this file to be governed by only the CDDL or
 * only the GPL Version 2, indicate your decision by adding "[Contributor]
 * elects to include this software in this distribution under the [CDDL or GPL
 * Version 2] license."  If you don't indicate a single choice of license, a
 * recipient has the option to distribute your version of this file under
 * either the CDDL, the GPL Version 2 or to extend the choice of license to
 * its licensees as provided above.  However, if you add GPL Version 2 code
 * and therefore, elected the GPL Version 2 license, then the option applies
 * only if the new code is made subject to such option by the copyright
 * holder.
 */

package com.sun.grizzly.util.http;

import com.sun.grizzly.util.buf.B2CConverter;
import com.sun.grizzly.util.buf.ByteChunk;
import com.sun.grizzly.util.buf.CharChunk;
import com.sun.grizzly.util.buf.MessageBytes;
import com.sun.grizzly.util.buf.UDecoder;
import java.io.IOException;
import java.util.logging.Level;
import java.util.logging.Logger;

/**
 * Utility class that makes sure an HTTP URL defined inside a {@link MessageBytes}
 * is normalized, converted and valid. It also makes sure there is no security
 * hole. Mainly, this class can be used by doing:
 * <p><pre><code>
 * 
 * HttpRequestURIDecoder.decode(decodedURI, urlDecoder, encoding, b2cConverter);
 * 
 * </code></pre>
 * 
 * @author Jeanfrancois Arcand
 */
public class HttpRequestURIDecoder {

    /**
     * Whether a backslash found in a URI is rewritten to a forward slash
     * during normalization. While this is {@code false}, the normalize methods
     * reject any URI that contains a backslash.
     */
    protected static final boolean ALLOW_BACKSLASH = false;
    /**
     * Whether runs of adjacent slashes are collapsed during normalization.
     * Read once, at class initialization, from the system property
     * {@code com.sun.enterprise.web.collapseAdjacentSlashes}; defaults to
     * {@code true} when the property is not set.
     */
    private static final boolean COLLAPSE_ADJACENT_SLASHES = 
            Boolean.valueOf(System.getProperty("com.sun.enterprise.web.collapseAdjacentSlashes"
            , "true")).booleanValue();
    /** Logger named after this class; used by the conversion and log methods. */
    private static Logger log = Logger.getLogger(
            HttpRequestURIDecoder.class.getName());

    /**
     * Decode the request URI held in a {@link MessageBytes} with the given
     * {@link UDecoder}, leaving the encoding and the byte-to-char converter
     * unspecified. Delegates to the four-argument overload with {@code null}
     * for both of them.
     *
     * @param decodedURI the URI to decode; it is modified in place
     * @param urlDecoder the decoder used for the %xx decoding
     * @throws java.lang.Exception if the delegate rejects or fails to decode
     *         the URI
     */
    public static final void decode(MessageBytes decodedURI, UDecoder urlDecoder)
            throws Exception {
        final String unspecifiedEncoding = null;
        final B2CConverter unspecifiedConverter = null;
        decode(decodedURI, urlDecoder, unspecifiedEncoding, unspecifiedConverter);
    }

    /**
     * Decode the request URI held in a {@link MessageBytes}: %xx-decode it with
     * the given {@link UDecoder}, normalize it, convert it to characters using
     * the given encoding and {@link B2CConverter}, and finally verify that the
     * converted URI is still normalized.
     *
     * @param decodedURI the URI to decode; it is modified in place
     * @param urlDecoder the decoder used for the %xx decoding
     * @param encoding the encoding name; {@code null} is replaced by "utf-8"
     * @param b2cConverter the bytes-to-chars converter, may be {@code null}
     * @throws java.lang.Exception an {@link IOException} when the URI fails
     *         normalization or the post-conversion check, or whatever the
     *         decoding and conversion steps throw
     */
    public static final void decode(MessageBytes decodedURI, UDecoder urlDecoder,
            String encoding, B2CConverter b2cConverter) throws Exception {
        // Step 1: %xx decoding of the URL
        urlDecoder.convert(decodedURI, false);

        // Step 2: normalization; a URI that cannot be normalized is rejected
        final boolean normalized = normalize(decodedURI);
        if (!normalized) {
            throw new IOException("Invalid URI character encoding");
        }

        // Step 3: character conversion, falling back to utf-8 when no
        // encoding was supplied
        final String effectiveEncoding = (encoding != null) ? encoding : "utf-8";
        convertURI(decodedURI, effectiveEncoding, b2cConverter);

        // Step 4: the conversion must not have re-introduced sequences that
        // normalization is supposed to remove
        if (checkNormalize(decodedURI)) {
            return;
        }
        throw new IOException("Invalid URI character encoding");
    }

    /**
     * Convert the bytes of a URI to characters. For any non-blank encoding
     * other than ISO-8859-1 the supplied {@link B2CConverter} is used, or a
     * new one is created for that encoding when none was supplied. If the
     * converter cannot be created or the conversion fails, or no converter
     * is needed, each byte is widened directly to a char.
     *
     * @param uri the URI whose byte chunk is converted into its char chunk
     * @param encoding the encoding name
     * @param b2cConverter the bytes-to-chars converter, may be {@code null}
     * @throws java.lang.Exception declared by the original signature
     */
    private static final void convertURI(MessageBytes uri, String encoding,
            B2CConverter b2cConverter)
            throws Exception {

        final ByteChunk source = uri.getByteChunk();
        final CharChunk target = uri.getCharChunk();
        target.allocate(source.getLength(), -1);

        final boolean wantsConverter = encoding != null
                && encoding.trim().length() != 0
                && !"ISO-8859-1".equalsIgnoreCase(encoding);

        if (wantsConverter) {
            B2CConverter converter = b2cConverter;
            if (converter == null) {
                try {
                    converter = new B2CConverter(encoding);
                } catch (IOException e) {
                    // Fall through to the byte-widening path below
                    log.severe("Invalid URI encoding; using HTTP default");
                }
            }
            if (converter != null) {
                try {
                    converter.convert(source, target);
                    uri.setChars(target.getBuffer(), target.getStart(),
                            target.getLength());
                    return;
                } catch (IOException e) {
                    log.severe("Invalid URI character encoding; trying ascii");
                    target.recycle();
                }
            }
        }

        // Default encoding: widen every byte to the char with the same value
        final byte[] bytes = source.getBuffer();
        final char[] chars = target.getBuffer();
        final int offset = source.getStart();
        int i = 0;
        while (i < source.getLength()) {
            chars[i] = (char) (bytes[offset + i] & 0xff);
            i++;
        }
        uri.setChars(chars, 0, source.getLength());

    }

    
    /**
     * Normalize a URI in place.
     * <p>
     * Dispatches on the type of the {@link MessageBytes}: content of type
     * {@code T_CHARS} is handled by the char-based normalizer, anything else
     * by the byte-based one. The normalizers deal with "\", "//", "/./" and
     * "/../" and report failure when the URI tries to go above the root or
     * contains a null character.
     *
     * @param uriMB URI to be normalized
     * @return {@code true} if the URI was normalized, {@code false} if it was
     *         rejected
     */
    public static boolean normalize(MessageBytes uriMB) {
        final boolean holdsChars = (uriMB.getType() == MessageBytes.T_CHARS);
        return holdsChars ? normalizeChars(uriMB) : normalizeBytes(uriMB);
    }


    /**
     * Check that the URI is normalized following character decoding.
     * <p>
     * This method checks for "\", 0, "//", "/./" and "/../", and for a URI that
     * ends with "/." or "/.." (a URI that consists of ".." alone is rejected
     * as well). It returns false if any sequence that is supposed to have been
     * normalized away is still present in the URI.
     * 
     * @param uriMB URI to be checked (should be chars)
     * @return {@code true} if none of the sequences above is present,
     *         {@code false} otherwise
     */
    public static boolean checkNormalize(MessageBytes uriMB) {

        CharChunk uriCC = uriMB.getCharChunk();
        char[] c = uriCC.getChars();
        int start = uriCC.getStart();
        int end = uriCC.getEnd();

        // Check for '\' and 0
        for (int pos = start; pos < end; pos++) {
            if (c[pos] == '\\' || c[pos] == 0) {
                return false;
            }
        }

        // Check for "//"
        // NOTE(review): this rejects "//" even when COLLAPSE_ADJACENT_SLASHES
        // is false, in which case normalization leaves "//" in place --
        // confirm that this is intended.
        for (int pos = start; pos < (end - 1); pos++) {
            if (c[pos] == '/' && c[pos + 1] == '/') {
                return false;
            }
        }

        // Check for ending with "/." or "/..". The character three positions
        // from the end is only read when the URI is at least three characters
        // long, so the check never reads in front of the chunk.
        int length = end - start;
        if ((length >= 2) && (c[end - 1] == '.')) {
            if (c[end - 2] == '/') {
                return false;
            }
            if ((c[end - 2] == '.')
                    && ((length == 2) || (c[end - 3] == '/'))) {
                // Either "/.." at the end, or the whole URI is ".."
                return false;
            }
        }

        // Check for "/./"
        if (uriCC.indexOf("/./", 0, 3, 0) >= 0) {
            return false;
        }

        // Check for "/../"
        if (uriCC.indexOf("/../", 0, 4, 0) >= 0) {
            return false;
        }

        return true;

    }


    /**
     * Normalize, in place, a URI held as characters.
     * <p>
     * The URI must be non-empty and, unless it is exactly "*", must start
     * with '/'. A backslash is rewritten to '/' when {@code ALLOW_BACKSLASH}
     * is set and rejected otherwise; a null character is always rejected.
     * Adjacent slashes are collapsed when {@code COLLAPSE_ADJACENT_SLASHES}
     * is set, "/./" is removed, and "/../" removes the preceding segment.
     *
     * @param uriMB URI whose char chunk is normalized
     * @return {@code true} on success; {@code false} if the URI is empty,
     *         contains a rejected character, does not start with '/', or
     *         tries to go above the root
     */
    private static boolean normalizeChars(MessageBytes uriMB) {

        CharChunk uriCC = uriMB.getCharChunk();
        char[] c = uriCC.getChars();
        int start = uriCC.getStart();
        int end = uriCC.getEnd();

        // An empty URL is not acceptable; this also keeps the c[start] reads
        // below inside the chunk.
        if (start == end) {
            return false;
        }

        // URL * is acceptable
        if ((end - start == 1) && c[start] == '*') {
            return true;
        }

        // Replace '\' with '/'
        // Check for null char
        for (int pos = start; pos < end; pos++) {
            if (c[pos] == '\\') {
                if (ALLOW_BACKSLASH) {
                    c[pos] = '/';
                } else {
                    return false;
                }
            }
            if (c[pos] == (char) 0) {
                return false;
            }
        }

        // The URL must start with '/'
        if (c[start] != '/') {
            return false;
        }

        // Replace "//" with "/"
        if (COLLAPSE_ADJACENT_SLASHES) {
            for (int pos = start; pos < (end - 1); pos++) {
                if (c[pos] == '/') {
                    while ((pos + 1 < end) && (c[pos + 1] == '/')) {
                        copyChars(c, pos, pos + 1, end - pos - 1);
                        end--;
                    }
                }
            }
        }

        // If the URI ends with "/." or "/..", then we append an extra "/"
        // Note: It is possible to extend the URI by 1 without any side effect
        // as the next character is a non-significant WS.
        // NOTE(review): that relies on the buffer having room after the URI;
        // confirm this holds for every caller that passes chars.
        if (((end - start) > 2) && (c[end - 1] == '.')) {
            if ((c[end - 2] == '/')
                    || ((c[end - 2] == '.') && (c[end - 3] == '/'))) {
                c[end] = '/';
                end++;
            }
        }

        uriCC.setEnd(end);

        // indexOf() results are used below as offsets relative to start
        int index = 0;

        // Resolve occurrences of "/./" in the normalized path
        while (true) {
            index = uriCC.indexOf("/./", 0, 3, index);
            if (index < 0) {
                break;
            }
            copyChars(c, start + index, start + index + 2,
                    end - start - index - 2);
            end = end - 2;
            uriCC.setEnd(end);
        }

        index = 0;

        // Resolve occurrences of "/../" in the normalized path
        while (true) {
            index = uriCC.indexOf("/../", 0, 4, index);
            if (index < 0) {
                break;
            }
            // Prevent from going outside our context
            if (index == 0) {
                return false;
            }
            // Find the slash that opens the segment in front of "/../".
            // The scan stays inside the chunk, and the result is kept
            // relative to start, like index, because it is added to start
            // below. c[start] is '/', so a slash is always found.
            int index2 = -1;
            for (int pos = start + index - 1;
                    (pos >= start) && (index2 < 0); pos--) {
                if (c[pos] == '/') {
                    index2 = pos - start;
                }
            }
            copyChars(c, start + index2, start + index + 3,
                    end - start - index - 3);
            end = end + index2 - index - 3;
            uriCC.setEnd(end);
            index = index2;
        }

        // Third argument is a length, not an end position. This assumes
        // CharChunk.setChars follows the (buffer, offset, length) convention
        // that the MessageBytes.setChars calls in this file use.
        uriCC.setChars(c, start, end - start);

        return true;

    }

    // ------------------------------------------------------ Protected Methods
    /**
     * Copy {@code len} bytes within the same array, from position
     * {@code src} to position {@code dest}. Used during normalization.
     * The copy is done with {@link System#arraycopy}, which copies correctly
     * even when the source and destination ranges overlap.
     *
     * @param b the array that is both source and destination
     * @param dest index at which the first copied byte is written
     * @param src index of the first byte to copy
     * @param len number of bytes to copy
     */
    protected static void copyBytes(byte[] b, int dest, int src, int len) {
        System.arraycopy(b, src, b, dest, len);
    }

    /**
     * Copy {@code len} chars within the same array, from position
     * {@code src} to position {@code dest}. Used during normalization.
     * The copy is done with {@link System#arraycopy}, which copies correctly
     * even when the source and destination ranges overlap.
     *
     * @param c the array that is both source and destination
     * @param dest index at which the first copied char is written
     * @param src index of the first char to copy
     * @param len number of chars to copy
     */
    private static void copyChars(char[] c, int dest, int src, int len) {
        System.arraycopy(c, src, c, dest, len);
    }

    /**
     * Log a message at INFO level on the logger of this class.
     *
     * @param message Message to be logged
     */
    protected void log(String message) {
        log.info(message);
    }

    /**
     * Log a message and its associated exception at SEVERE level on the
     * logger of this class.
     *
     * @param message Message to be logged
     * @param throwable Associated exception
     */
    protected void log(String message, Throwable throwable) {
        log.log(Level.SEVERE, message, throwable);
    }

    /**
     * Convert the bytes of a {@link MessageBytes} to characters by widening
     * each byte to the char with the same unsigned value. Does nothing unless
     * the content is of type {@code T_BYTES}.
     *
     * @param mb the message bytes whose byte chunk is converted into its char
     *        chunk
     */
    protected void convertMB(MessageBytes mb) {

        // Only byte content can be converted
        if (mb.getType() == MessageBytes.T_BYTES) {
            final ByteChunk source = mb.getByteChunk();
            final CharChunk target = mb.getCharChunk();
            target.allocate(source.getLength(), -1);

            // Default encoding: fast conversion
            final byte[] bytes = source.getBuffer();
            final char[] chars = target.getBuffer();
            final int offset = source.getStart();
            int i = 0;
            while (i < source.getLength()) {
                chars[i] = (char) (bytes[offset + i] & 0xff);
                i++;
            }
            mb.setChars(chars, 0, source.getLength());
        }

    }
    
    // States of the single-pass scanner in normalizeBytes. Each one describes
    // what the bytes seen most recently look like.
    // Last byte was an ordinary character (also the initial state).
    private static final int STATE_CHAR=0;
    // Last byte was '/'.
    private static final int STATE_SLASH=1;
    // Not referenced by any code in this class.
    private static final int STATE_PERCENT=2;
    // Last two bytes were "/.".
    private static final int STATE_SLASHDOT=3;
    // Last three bytes were "/..".
    private static final int STATE_SLASHDOTDOT=4;    
    
    /**
     * Normalize, in place, a URI held as bytes, in a single pass.
     * <p>
     * Bytes are read at {@code pos} and the normalized output is written
     * behind it at {@code srcPos}. "/./" is removed, "/../" removes the
     * preceding segment, and adjacent slashes are collapsed when
     * {@code COLLAPSE_ADJACENT_SLASHES} is set. A backslash is rewritten to
     * '/' when {@code ALLOW_BACKSLASH} is set and rejected otherwise. A
     * segment of three or more dots is an ordinary segment and is kept.
     * <p>
     * NOTE(review): unlike the char-based normalizer, this method does not
     * require the URI to start with '/' -- confirm whether callers rely on
     * that.
     *
     * @param mb URI whose byte chunk is normalized
     * @return {@code true} on success (the end of the byte chunk is moved to
     *         the end of the normalized URI, except for "*", which is
     *         accepted untouched); {@code false} if the URI is empty,
     *         contains a null byte or a rejected backslash, or contains a
     *         "/../" that has no segment left to remove
     */
    public static boolean normalizeBytes (MessageBytes mb) {
        ByteChunk bc = mb.getByteChunk();
        byte[] bs = bc.getBytes();
        int start = bc.getStart();
        int end = bc.getEnd();

        // An empty URL is not acceptable
        if (start == end) {
            return false;
        }

        // URL * is acceptable
        if ((end - start == 1) && bs[start] == (byte) '*') {
            return true;
        }

        // If the URI ends with "/." or "/..", then we append an extra "/"
        // Note: It is possible to extend the URI by 1 without any side effect
        // as the next character is a non-significant WS.
        if (((end - start) > 2) && (bs[end - 1] == (byte) '.')) {
            if ((bs[end - 2] == (byte) '/')
                    || ((bs[end - 2] == (byte) '.') && (bs[end - 3] == (byte) '/'))) {
                bs[end] = (byte) '/';
                end++;
            }
        }

        int state = STATE_CHAR;
        // Next write position in the normalized output
        int srcPos = start;

        // Output positions of the slash that opened the current segment and
        // of the slash before that one; -1 when there is none.
        int lastSlash = -1;
        int parentSlash = -1;

        for (int pos = start; pos < end; pos++) {
            if (bs[pos] == (byte) 0) {
                return false;
            }
            if (bs[pos] == (byte) '\\') {
                if (ALLOW_BACKSLASH) {
                    bs[pos] = (byte) '/';
                } else {
                    return false;
                }
            }
            if (bs[pos] == '/') {
                if (state == STATE_CHAR) {
                    state = STATE_SLASH;
                    bs[srcPos] = bs[pos];
                    parentSlash = lastSlash;
                    lastSlash = srcPos;
                    srcPos++;
                } else if (state == STATE_SLASH) {
                    // This is '//'. Ignore if COLLAPSE_ADJACENT_SLASHES is true.
                    // What is the behavior for '/../' patterns if collapse is false.
                    // Ignoring for now.
                    if (!COLLAPSE_ADJACENT_SLASHES) {
                        // The slash has to be written, not just skipped over:
                        // once earlier input has been compacted, srcPos lags
                        // behind pos and holds a stale byte.
                        bs[srcPos++] = bs[pos];
                    }
                } else if (state == STATE_SLASHDOT) {
                    // This is '/./' ==> drop the '.' that was written; the
                    // output now ends with the slash in front of it, so the
                    // scanner is back in the "just saw a slash" state.
                    srcPos--;
                    state = STATE_SLASH;
                } else if (state == STATE_SLASHDOTDOT) {
                    // This is '/../' ==> search backward to reset lastSlash and parentSlash
                    if (parentSlash == -1) {
                        // This is an error: nothing left to go up from
                        return false;
                    }
                    lastSlash = parentSlash;
                    srcPos = parentSlash;
                    // Find the new parentSlash in the output written so far
                    parentSlash = -1;
                    for (int i = lastSlash - 1; i >= start; i--) {
                        if (bs[i] == '/') {
                            parentSlash = i;
                            break;
                        }
                    }
                    state = STATE_SLASH;
                    bs[srcPos++] = bs[pos];
                }
            } else if (bs[pos] == '.') {
                if (state == STATE_SLASH) {
                    state = STATE_SLASHDOT;
                } else if (state == STATE_SLASHDOT) {
                    state = STATE_SLASHDOTDOT;
                } else if (state == STATE_SLASHDOTDOT) {
                    // A third dot: "/..." starts an ordinary segment, it is
                    // not a parent reference.
                    state = STATE_CHAR;
                }
                // In STATE_CHAR the dot is an ordinary character.
                bs[srcPos++] = bs[pos];
            } else {
                state = STATE_CHAR;
                bs[srcPos++] = bs[pos];
            }
        }

        bc.setEnd(srcPos);
        return true;
    }
}