1 /* 2 * $HeadURL: http://svn.apache.org/repos/asf/httpcomponents/httpcore/trunk/module-main/src/main/java/org/apache/http/impl/entity/LaxContentLengthStrategy.java $ 3 * $Revision: 576073 $ 4 * $Date: 2007-09-16 03:53:13 -0700 (Sun, 16 Sep 2007) $ 5 * 6 * ==================================================================== 7 * Licensed to the Apache Software Foundation (ASF) under one 8 * or more contributor license agreements. See the NOTICE file 9 * distributed with this work for additional information 10 * regarding copyright ownership. The ASF licenses this file 11 * to you under the Apache License, Version 2.0 (the 12 * "License"); you may not use this file except in compliance 13 * with the License. You may obtain a copy of the License at 14 * 15 * http://www.apache.org/licenses/LICENSE-2.0 16 * 17 * Unless required by applicable law or agreed to in writing, 18 * software distributed under the License is distributed on an 19 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY 20 * KIND, either express or implied. See the License for the 21 * specific language governing permissions and limitations 22 * under the License. 23 * ==================================================================== 24 * 25 * This software consists of voluntary contributions made by many 26 * individuals on behalf of the Apache Software Foundation. For more 27 * information on the Apache Software Foundation, please see 28 * <http://www.apache.org/>. 
29 * 30 */ 31 32 package org.apache.http.impl.entity; 33 34 import org.apache.http.Header; 35 import org.apache.http.HeaderElement; 36 import org.apache.http.HttpException; 37 import org.apache.http.HttpMessage; 38 import org.apache.http.ParseException; 39 import org.apache.http.ProtocolException; 40 import org.apache.http.entity.ContentLengthStrategy; 41 import org.apache.http.params.HttpParams; 42 import org.apache.http.params.CoreProtocolPNames; 43 import org.apache.http.protocol.HTTP; 44 45 /** 46 * The lax implementation of the content length strategy. 47 * <p> 48 * This strategy conforms to the entity transfer rules outlined in 49 * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec3.html#sec4.4">Section 4.4</a>, 50 * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec3.html#sec3.6">Section 3.6</a>, 51 * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec14.html#sec14.41">Section 14.41</a> 52 * and <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec3.html#sec14.13">Section 14.13</a> 53 * of <a href="http://www.w3.org/Protocols/rfc2616/rfc2616.txt">RFC 2616</a>, but is lenient 54 * about unsupported transfer codecs and malformed content-length headers. 55 * </p> 56 * <h>4.4 Message Length</h> 57 * <p> 58 * The transfer-length of a message is the length of the message-body as it appears in the 59 * message; that is, after any transfer-codings have been applied. When a message-body is 60 * included with a message, the transfer-length of that body is determined by one of the 61 * following (in order of precedence): 62 * </p> 63 * <p> 64 * 1.Any response message which "MUST NOT" include a message-body (such as the 1xx, 204, 65 * and 304 responses and any response to a HEAD request) is always terminated by the first 66 * empty line after the header fields, regardless of the entity-header fields present in the 67 * message. 
 * </p>
 * <p>
 * 2.If a Transfer-Encoding header field (section 14.41) is present and has any value other
 * than "identity", then the transfer-length is defined by use of the "chunked"
 * transfer-coding (section 3.6), unless the message is terminated by closing the connection.
 * </p>
 * <p>
 * 3.If a Content-Length header field (section 14.13) is present, its decimal value in
 * OCTETs represents both the entity-length and the transfer-length. The Content-Length
 * header field MUST NOT be sent if these two lengths are different (i.e., if a
 * Transfer-Encoding header field is present). If a message is received with both a
 * Transfer-Encoding header field and a Content-Length header field,
 * the latter MUST be ignored.
 * </p>
 * <p>
 * 4.If the message uses the media type "multipart/byteranges", and the transfer-length is not
 * otherwise specified, then this self-delimiting media type defines the transfer-length.
 * This media type MUST NOT be used unless the sender knows that the recipient can parse it; the
 * presence in a request of a Range header with multiple byte-range specifiers from a 1.1
 * client implies that the client can parse multipart/byteranges responses.
 * </p>
 * <pre>
 *     A range header might be forwarded by a 1.0 proxy that does not
 *     understand multipart/byteranges; in this case the server MUST
 *     delimit the message using methods defined in items 1,3 or 5 of
 *     this section.
 * </pre>
 * <p>
 * 5.By the server closing the connection. (Closing the connection cannot be used to indicate
 * the end of a request body, since that would leave no possibility for the server to send back
 * a response.)
 * </p>
 * <p>
 * For compatibility with HTTP/1.0 applications, HTTP/1.1 requests containing a message-body
 * MUST include a valid Content-Length header field unless the server is known to be HTTP/1.1
 * compliant.
If a request contains a message-body and a Content-Length is not given, the 107 * server SHOULD respond with 400 (bad request) if it cannot determine the length of the 108 * message, or with 411 (length required) if it wishes to insist on receiving a valid 109 * Content-Length. 110 * </p> 111 * <p>All HTTP/1.1 applications that receive entities MUST accept the "chunked" transfer-coding 112 * (section 3.6), thus allowing this mechanism to be used for messages when the message 113 * length cannot be determined in advance. 114 * </p> 115 * <h>3.6 Transfer Codings</h> 116 * <p> 117 * Transfer-coding values are used to indicate an encoding transformation that 118 * has been, can be, or may need to be applied to an entity-body in order to ensure 119 * "safe transport" through the network. This differs from a content coding in that 120 * the transfer-coding is a property of the message, not of the original entity. 121 * </p> 122 * <pre> 123 * transfer-coding = "chunked" | transfer-extension 124 * transfer-extension = token *( ";" parameter ) 125 * </pre> 126 * <p> 127 * Parameters are in the form of attribute/value pairs. 128 * </p> 129 * <pre> 130 * parameter = attribute "=" value 131 * attribute = token 132 * value = token | quoted-string 133 * </pre> 134 * <p> 135 * All transfer-coding values are case-insensitive. HTTP/1.1 uses transfer-coding values in 136 * the TE header field (section 14.39) and in the Transfer-Encoding header field (section 14.41). 137 * </p> 138 * <p> 139 * Whenever a transfer-coding is applied to a message-body, the set of transfer-codings MUST 140 * include "chunked", unless the message is terminated by closing the connection. When the 141 * "chunked" transfer-coding is used, it MUST be the last transfer-coding applied to the 142 * message-body. The "chunked" transfer-coding MUST NOT be applied more than once to a 143 * message-body. These rules allow the recipient to determine the transfer-length of the 144 * message (section 4.4). 
145 * </p> 146 * <h>14.41 Transfer-Encoding</h> 147 * <p> 148 * The Transfer-Encoding general-header field indicates what (if any) type of transformation has 149 * been applied to the message body in order to safely transfer it between the sender and the 150 * recipient. This differs from the content-coding in that the transfer-coding is a property of 151 * the message, not of the entity. 152 * </p> 153 * <pre> 154 * Transfer-Encoding = "Transfer-Encoding" ":" 1#transfer-coding 155 * </pre> 156 * <p> 157 * If multiple encodings have been applied to an entity, the transfer- codings MUST be listed in 158 * the order in which they were applied. Additional information about the encoding parameters 159 * MAY be provided by other entity-header fields not defined by this specification. 160 * </p> 161 * <h>14.13 Content-Length</h> 162 * <p> 163 * The Content-Length entity-header field indicates the size of the entity-body, in decimal 164 * number of OCTETs, sent to the recipient or, in the case of the HEAD method, the size of 165 * the entity-body that would have been sent had the request been a GET. 166 * </p> 167 * <pre> 168 * Content-Length = "Content-Length" ":" 1*DIGIT 169 * </pre> 170 * <p> 171 * Applications SHOULD use this field to indicate the transfer-length of the message-body, 172 * unless this is prohibited by the rules in section 4.4. 
173 * </p> 174 * 175 * @author <a href="mailto:oleg at ural.ru">Oleg Kalnichevski</a> 176 * 177 * @version $Revision: 576073 $ 178 * 179 * @since 4.0 180 */ 181 public class LaxContentLengthStrategy implements ContentLengthStrategy { 182 183 public LaxContentLengthStrategy() { 184 super(); 185 } 186 187 public long determineLength(final HttpMessage message) throws HttpException { 188 if (message == null) { 189 throw new IllegalArgumentException("HTTP message may not be null"); 190 } 191 192 HttpParams params = message.getParams(); 193 boolean strict = params.isParameterTrue(CoreProtocolPNames.STRICT_TRANSFER_ENCODING); 194 195 Header transferEncodingHeader = message.getFirstHeader(HTTP.TRANSFER_ENCODING); 196 Header contentLengthHeader = message.getFirstHeader(HTTP.CONTENT_LEN); 197 // We use Transfer-Encoding if present and ignore Content-Length. 198 // RFC2616, 4.4 item number 3 199 if (transferEncodingHeader != null) { 200 HeaderElement[] encodings = null; 201 try { 202 encodings = transferEncodingHeader.getElements(); 203 } catch (ParseException px) { 204 throw new ProtocolException 205 ("Invalid Transfer-Encoding header value: " + 206 transferEncodingHeader, px); 207 } 208 if (strict) { 209 // Currently only chunk and identity are supported 210 for (int i = 0; i < encodings.length; i++) { 211 String encoding = encodings[i].getName(); 212 if (encoding != null && encoding.length() > 0 213 && !encoding.equalsIgnoreCase(HTTP.CHUNK_CODING) 214 && !encoding.equalsIgnoreCase(HTTP.IDENTITY_CODING)) { 215 throw new ProtocolException("Unsupported transfer encoding: " + encoding); 216 } 217 } 218 } 219 // The chunked encoding must be the last one applied RFC2616, 14.41 220 int len = encodings.length; 221 if (HTTP.IDENTITY_CODING.equalsIgnoreCase(transferEncodingHeader.getValue())) { 222 return IDENTITY; 223 } else if ((len > 0) && (HTTP.CHUNK_CODING.equalsIgnoreCase( 224 encodings[len - 1].getName()))) { 225 return CHUNKED; 226 } else { 227 if (strict) { 228 throw new 
ProtocolException("Chunk-encoding must be the last one applied"); 229 } 230 return IDENTITY; 231 } 232 } else if (contentLengthHeader != null) { 233 long contentlen = -1; 234 Header[] headers = message.getHeaders(HTTP.CONTENT_LEN); 235 if (strict && headers.length > 1) { 236 throw new ProtocolException("Multiple content length headers"); 237 } 238 for (int i = headers.length - 1; i >= 0; i--) { 239 Header header = headers[i]; 240 try { 241 contentlen = Long.parseLong(header.getValue()); 242 break; 243 } catch (NumberFormatException e) { 244 if (strict) { 245 throw new ProtocolException("Invalid content length: " + header.getValue()); 246 } 247 } 248 // See if we can have better luck with another header, if present 249 } 250 if (contentlen >= 0) { 251 return contentlen; 252 } else { 253 return IDENTITY; 254 } 255 } else { 256 return IDENTITY; 257 } 258 } 259 260 } 261