Home | History | Annotate | Download | only in message
      1 /*
      2  * $HeadURL: http://svn.apache.org/repos/asf/httpcomponents/httpcore/trunk/module-main/src/main/java/org/apache/http/message/HeaderValueParser.java $
      3  * $Revision: 589325 $
      4  * $Date: 2007-10-28 03:37:56 -0700 (Sun, 28 Oct 2007) $
      5  *
      6  * ====================================================================
      7  * Licensed to the Apache Software Foundation (ASF) under one
      8  * or more contributor license agreements.  See the NOTICE file
      9  * distributed with this work for additional information
     10  * regarding copyright ownership.  The ASF licenses this file
     11  * to you under the Apache License, Version 2.0 (the
     12  * "License"); you may not use this file except in compliance
     13  * with the License.  You may obtain a copy of the License at
     14  *
     15  *   http://www.apache.org/licenses/LICENSE-2.0
     16  *
     17  * Unless required by applicable law or agreed to in writing,
     18  * software distributed under the License is distributed on an
     19  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
     20  * KIND, either express or implied.  See the License for the
     21  * specific language governing permissions and limitations
     22  * under the License.
     23  * ====================================================================
     24  *
     25  * This software consists of voluntary contributions made by many
     26  * individuals on behalf of the Apache Software Foundation.  For more
     27  * information on the Apache Software Foundation, please see
     28  * <http://www.apache.org/>.
     29  *
     30  */
     31 
     32 package org.apache.http.message;
     33 
     34 
     35 import org.apache.http.HeaderElement;
     36 import org.apache.http.NameValuePair;
     37 import org.apache.http.ParseException;
     38 import org.apache.http.util.CharArrayBuffer;
     39 
     40 
     41 
     42 /**
     43  * Interface for parsing header values into elements.
     44  * Instances of this interface are expected to be stateless and thread-safe.
     45  *
     46  *
     47  * <!-- empty lines above to avoid 'svn diff' context problems -->
     48  * @version $Revision: 589325 $ $Date: 2007-10-28 03:37:56 -0700 (Sun, 28 Oct 2007) $
     49  *
     50  * @since 4.0
     51  */
     52 public interface HeaderValueParser {
     53 
     54     /**
     55      * Parses a header value into elements.
     56      * Parse errors are indicated as <code>RuntimeException</code>.
     57      * <p>
     58      * Some HTTP headers (such as the set-cookie header) have values that
     59      * can be decomposed into multiple elements. In order to be processed
     60      * by this parser, such headers must be in the following form:
     61      * </p>
     62      * <pre>
     63      * header  = [ element ] *( "," [ element ] )
     64      * element = name [ "=" [ value ] ] *( ";" [ param ] )
     65      * param   = name [ "=" [ value ] ]
     66      *
     67      * name    = token
     68      * value   = ( token | quoted-string )
     69      *
     70      * token         = 1*&lt;any char except "=", ",", ";", &lt;"&gt; and
     71      *                       white space&gt;
     72      * quoted-string = &lt;"&gt; *( text | quoted-char ) &lt;"&gt;
     73      * text          = any char except &lt;"&gt;
     74      * quoted-char   = "\" char
     75      * </pre>
     76      * <p>
     77      * Any amount of white space is allowed between any part of the
     78      * header, element or param and is ignored. A missing value in any
     79      * element or param will be stored as the empty {@link String};
     80      * if the "=" is also missing <var>null</var> will be stored instead.
     81      * </p>
     82      *
     83      * @param buffer    buffer holding the header value to parse
     84      * @param cursor    the parser cursor containing the current position and
     85      *                  the bounds within the buffer for the parsing operation
     86      *
     87      * @return  an array holding all elements of the header value
     88      *
     89      * @throws ParseException        in case of a parse error
     90      */
     91     HeaderElement[] parseElements(
     92             CharArrayBuffer buffer,
     93             ParserCursor cursor) throws ParseException;
     94 
     95     /**
     96      * Parses a single header element.
     97      * A header element consist of a semicolon-separate list
     98      * of name=value definitions.
     99      *
    100      * @param buffer    buffer holding the element to parse
    101      * @param cursor    the parser cursor containing the current position and
    102      *                  the bounds within the buffer for the parsing operation
    103      *
    104      * @return  the parsed element
    105      *
    106      * @throws ParseException        in case of a parse error
    107      */
    108     HeaderElement parseHeaderElement(
    109             CharArrayBuffer buffer,
    110             ParserCursor cursor) throws ParseException;
    111 
    112     /**
    113      * Parses a list of name-value pairs.
    114      * These lists are used to specify parameters to a header element.
    115      * Parse errors are indicated as <code>RuntimeException</code>.
    116      * <p>
    117      * This method comforms to the generic grammar and formatting rules
    118      * outlined in the
    119      * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec2.html#sec2.2"
    120      *   >Section 2.2</a>
    121      * and
    122      * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616-sec3.html#sec3.6"
    123      *   >Section 3.6</a>
    124      * of
    125      * <a href="http://www.w3.org/Protocols/rfc2616/rfc2616.txt">RFC 2616</a>.
    126      * </p>
    127      * <h>2.2 Basic Rules</h>
    128      * <p>
    129      * The following rules are used throughout this specification to
    130      * describe basic parsing constructs.
    131      * The US-ASCII coded character set is defined by ANSI X3.4-1986.
    132      * </p>
    133      * <pre>
    134      *     OCTET          = <any 8-bit sequence of data>
    135      *     CHAR           = <any US-ASCII character (octets 0 - 127)>
    136      *     UPALPHA        = <any US-ASCII uppercase letter "A".."Z">
    137      *     LOALPHA        = <any US-ASCII lowercase letter "a".."z">
    138      *     ALPHA          = UPALPHA | LOALPHA
    139      *     DIGIT          = <any US-ASCII digit "0".."9">
    140      *     CTL            = <any US-ASCII control character
    141      *                      (octets 0 - 31) and DEL (127)>
    142      *     CR             = <US-ASCII CR, carriage return (13)>
    143      *     LF             = <US-ASCII LF, linefeed (10)>
    144      *     SP             = <US-ASCII SP, space (32)>
    145      *     HT             = <US-ASCII HT, horizontal-tab (9)>
    146      *     <">            = <US-ASCII double-quote mark (34)>
    147      * </pre>
    148      * <p>
    149      * Many HTTP/1.1 header field values consist of words separated
    150      * by LWS or special characters. These special characters MUST be
    151      * in a quoted string to be used within
    152      * a parameter value (as defined in section 3.6).
    153      * <p>
    154      * <pre>
    155      * token          = 1*<any CHAR except CTLs or separators>
    156      * separators     = "(" | ")" | "<" | ">" | "@"
    157      *                | "," | ";" | ":" | "\" | <">
    158      *                | "/" | "[" | "]" | "?" | "="
    159      *                | "{" | "}" | SP | HT
    160      * </pre>
    161      * <p>
    162      * A string of text is parsed as a single word if it is quoted using
    163      * double-quote marks.
    164      * </p>
    165      * <pre>
    166      * quoted-string  = ( <"> *(qdtext | quoted-pair ) <"> )
    167      * qdtext         = <any TEXT except <">>
    168      * </pre>
    169      * <p>
    170      * The backslash character ("\") MAY be used as a single-character
    171      * quoting mechanism only within quoted-string and comment constructs.
    172      * </p>
    173      * <pre>
    174      * quoted-pair    = "\" CHAR
    175      * </pre>
    176      * <h>3.6 Transfer Codings</h>
    177      * <p>
    178      * Parameters are in the form of attribute/value pairs.
    179      * </p>
    180      * <pre>
    181      * parameter               = attribute "=" value
    182      * attribute               = token
    183      * value                   = token | quoted-string
    184      * </pre>
    185      *
    186      * @param buffer    buffer holding the name-value list to parse
    187      * @param cursor    the parser cursor containing the current position and
    188      *                  the bounds within the buffer for the parsing operation
    189      *
    190      * @return  an array holding all items of the name-value list
    191      *
    192      * @throws ParseException        in case of a parse error
    193      */
    194     NameValuePair[] parseParameters(
    195             CharArrayBuffer buffer,
    196             ParserCursor cursor) throws ParseException;
    197 
    198 
    199     /**
    200      * Parses a name=value specification, where the = and value are optional.
    201      *
    202      * @param buffer    the buffer holding the name-value pair to parse
    203      * @param cursor    the parser cursor containing the current position and
    204      *                  the bounds within the buffer for the parsing operation
    205      *
    206      * @return  the name-value pair, where the value is <code>null</code>
    207      *          if no value is specified
    208      */
    209     NameValuePair parseNameValuePair(
    210             CharArrayBuffer buffer,
    211             ParserCursor cursor) throws ParseException;
    212 
    213 }
    214 
    215