/* * ChunkedConsumer.java February 2007 * * Copyright (C) 2007, Niall Gallagher <niallg@users.sf.net> * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or * implied. See the License for the specific language governing * permissions and limitations under the License. */ package org.simpleframework.http.message; import java.io.IOException; import org.simpleframework.util.buffer.Allocator; import org.simpleframework.util.buffer.Buffer; /** * The <code>ChunkedConsumer</code> is reads an decodes a stream using the * chunked transfer coding. This is used so that any data sent in the chunked * transfer coding can be decoded. All bytes are appended to an internal buffer * so that they can be read without having to parse the encoding. * * <pre> * * length := 0 * read chunk-size, chunk-extension (if any) and CRLF * while (chunk-size > 0) { * read chunk-data and CRLF * append chunk-data to entity-body * length := length + chunk-size * read chunk-size and CRLF * } * read entity-header * while (entity-header not empty) { * append entity-header to existing header fields * read entity-header * } * * </pre> * * The above algorithm is taken from RFC 2616 section 19.4.6. This coding scheme * is used in HTTP pipelines so that dynamic content, that is, content with * which a length cannot be determined does not require a connection close to * delimit the message body. * * @author Niall Gallagher */ public class ChunkedConsumer extends UpdateConsumer { /** * This is used to create the internal buffer for the body. */ private Allocator allocator; /** * This is the internal buffer used to capture the body read. */ private Buffer buffer; /** * This is used to determine whether a full chunk has been read. */ private boolean terminal; /** * This is used to determine if the zero length chunk was read. */ private boolean last; /** * This is used to accumulate the bytes of the chunk size line. */ private byte line[]; /** * This is the number of bytes appended to the line buffer. */ private int count; /** * This is the number of bytes left in the current chunk. */ private int chunk; /** * Constructor for the <code>ChunkedConsumer</code> object. This is used to * create a consumer that reads chunked encoded data and appended that data * in decoded form to an internal buffer so that it can be read in a clean * decoded fromat. * * @param allocator * this is used to allocate the internal buffer */ public ChunkedConsumer(Allocator allocator) { this(allocator, 1024); } /** * Constructor for the <code>ChunkedConsumer</code> object. This is used to * create a consumer that reads chunked encoded data and appended that data * in decoded form to an internal buffer so that it can be read in a clean * decoded fromat. * * @param allocator * this is used to allocate the internal buffer * @param chunk * this is the maximum size line allowed */ private ChunkedConsumer(Allocator allocator, int chunk) { this.line = new byte[chunk]; this.allocator = allocator; } /** * This is used to acquire the body that has been consumed. This will return * a body which can be used to read the content of the message, also if the * request is multipart upload then all of the parts are provided as * <code>Attachment</code> objects. Each part can then be read as an * individual message. * * @return the body that has been consumed by this instance */ @Override public Body getBody() { return new BufferBody(this.buffer); } /** * This method is used to append the contents of the array to the internal * buffer. The appended bytes can be acquired from the internal buffer using * an <code>InputStream</code>, or the text of the appended bytes can be * acquired by encoding the bytes. * * @param array * this is the array of bytes to be appended * @param off * this is the start offset in the array to read from * @param len * this is the number of bytes to write to the buffer */ private void append(byte[] array, int off, int len) throws IOException { if (this.buffer == null) { this.buffer = this.allocator.allocate(); } this.buffer.append(array, off, len); } /** * This is used to process the bytes that have been read from the cursor. * This will keep reading bytes from the stream until such time as the zero * length chunk has been read from the stream. If the zero length chunk is * encountered then the overflow count is returned so it can be used to * reset the cursor. * * @param array * this is a chunk read from the cursor * @param off * this is the offset within the array the chunk starts * @param size * this is the number of bytes within the array * * @return this returns the number of bytes overflow that is read */ @Override protected int update(byte[] array, int off, int size) throws IOException { int mark = off + size; while (off < mark) { if (this.terminal || this.last) { while (off < mark) { if (array[off++] == '\n') { // CR[LF] if (this.last) { // 0; CRLFCR[LF] this.finished = true; return mark - off; } this.terminal = false; break; } } } else if (this.chunk == 0) { while (this.chunk == 0) { if (off >= mark) { break; } else if (array[off++] == '\n') { // CR[LF] this.parse(); if (this.chunk == 0) { // 0; CR[LF]CRLF this.last = true; break; } } else { this.line[this.count++] = array[off - 1]; } } } else { int write = Math.min(mark - off, this.chunk); this.append(array, off, write); this.chunk -= write; off += write; if (this.chunk == 0) { // []CRLF this.terminal = true; } } } return 0; } /** * This method is used to convert the size in hexidecimal to a decimal * <code>int</code>. This will use the specified number of bytes from the * internal buffer and parse each character read as a hexidecimal character. * This stops interpreting the size line when a non-hexidecimal character is * encountered. */ private void parse() throws IOException { int off = 0; while (off < this.count) { int octet = this.toDecimal(this.line[off]); if (octet < 0) { if (off < 1) throw new IOException("Invalid chunk size line"); break; } this.chunk <<= 4; this.chunk ^= octet; off++; } this.count = 0; } /** * This performs a conversion from a character to an integer. If the * character given, as a <code>byte</code>, is a hexidecimal char this will * convert it into its integer equivelant. So a char of <code>A</code> is * converted into <code>10</code>. * * @param octet * this is an ISO 8869-1 hexidecimal character * * @return returns the hex character into its decinal value */ private int toDecimal(byte octet) { if ((octet >= 'A') && (octet <= 'Z')) return (octet - 'A') + 10; if ((octet >= '0') && (octet <= '9')) return octet - '0'; if ((octet >= 'a') && (octet <= 'f')) return (octet - 'a') + 10; return -1; } }