source: draft-ietf-httpbis/latest/p1-messaging.xml @ 273

Last change on this file since 273 was 273, checked in by julian.reschke@…, 11 years ago

Do not use string literals in ABNF when matching is case-sensitive (related to #36)

  • Property svn:eol-style set to native
File size: 197.0 KB
Line 
1<?xml version="1.0" encoding="utf-8"?>
2<?xml-stylesheet type='text/xsl' href='../myxml2rfc.xslt'?>
3<!DOCTYPE rfc [
4  <!ENTITY MAY "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>MAY</bcp14>">
5  <!ENTITY MUST "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>MUST</bcp14>">
6  <!ENTITY MUST-NOT "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>MUST NOT</bcp14>">
7  <!ENTITY OPTIONAL "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>OPTIONAL</bcp14>">
8  <!ENTITY RECOMMENDED "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>RECOMMENDED</bcp14>">
9  <!ENTITY REQUIRED "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>REQUIRED</bcp14>">
10  <!ENTITY SHALL "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>SHALL</bcp14>">
11  <!ENTITY SHALL-NOT "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>SHALL NOT</bcp14>">
12  <!ENTITY SHOULD "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>SHOULD</bcp14>">
13  <!ENTITY SHOULD-NOT "<bcp14 xmlns='http://purl.org/net/xml2rfc/ext'>SHOULD NOT</bcp14>">
14  <!ENTITY ID-VERSION "latest">
15  <!ENTITY ID-MONTH "July">
16  <!ENTITY ID-YEAR "2008">
17  <!ENTITY caching                "<xref target='Part6' x:rel='#caching' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
18  <!ENTITY payload                "<xref target='Part3' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
19  <!ENTITY media-types            "<xref target='Part3' x:rel='#media.types' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
20  <!ENTITY content-codings        "<xref target='Part3' x:rel='#content.codings' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
21  <!ENTITY CONNECT                "<xref target='Part2' x:rel='#CONNECT' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
22  <!ENTITY content.negotiation    "<xref target='Part3' x:rel='#content.negotiation' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
23  <!ENTITY diff2045entity         "<xref target='Part3' x:rel='#differences.between.http.entities.and.rfc.2045.entities' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
24  <!ENTITY entity                 "<xref target='Part3' x:rel='#entity' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
25  <!ENTITY entity-body            "<xref target='Part3' x:rel='#entity.body' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
26  <!ENTITY entity-header-fields   "<xref target='Part3' x:rel='#entity.header.fields' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
27  <!ENTITY header-accept          "<xref target='Part3' x:rel='#header.accept' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
28  <!ENTITY header-cache-control   "<xref target='Part6' x:rel='#header.cache-control' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
29  <!ENTITY header-expect          "<xref target='Part2' x:rel='#header.expect' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
30  <!ENTITY header-pragma          "<xref target='Part6' x:rel='#header.pragma' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
31  <!ENTITY header-warning         "<xref target='Part6' x:rel='#header.warning' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
32  <!ENTITY idempotent-methods     "<xref target='Part2' x:rel='#idempotent.methods' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
33  <!ENTITY qvalue                 "<xref target='Part3' x:rel='#quality.values' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
34  <!ENTITY request-header-fields  "<xref target='Part2' x:rel='#request.header.fields' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
35  <!ENTITY response-header-fields "<xref target='Part2' x:rel='#response.header.fields' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
36  <!ENTITY method                 "<xref target='Part2' x:rel='#method' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
37  <!ENTITY status-codes           "<xref target='Part2' x:rel='#status.codes' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
38  <!ENTITY status-100             "<xref target='Part2' x:rel='#status.100' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
39  <!ENTITY status-1xx             "<xref target='Part2' x:rel='#status.1xx' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
40  <!ENTITY status-414             "<xref target='Part2' x:rel='#status.414' xmlns:x='http://purl.org/net/xml2rfc/ext'/>">
41]>
42<?rfc toc="yes" ?>
43<?rfc symrefs="yes" ?>
44<?rfc sortrefs="yes" ?>
45<?rfc compact="yes"?>
46<?rfc subcompact="no" ?>
47<?rfc linkmailto="no" ?>
48<?rfc editing="no" ?>
49<?rfc comments="yes"?>
50<?rfc inline="yes"?>
51<?rfc-ext allow-markup-in-artwork="yes" ?>
52<?rfc-ext include-references-in-index="yes" ?>
53<rfc obsoletes="2616" category="std"
54     ipr="full3978" docName="draft-ietf-httpbis-p1-messaging-&ID-VERSION;"
55     xmlns:x='http://purl.org/net/xml2rfc/ext'>
56<front>
57
58  <title abbrev="HTTP/1.1, Part 1">HTTP/1.1, part 1: URIs, Connections, and Message Parsing</title>
59
60  <author initials="R." surname="Fielding" fullname="Roy T. Fielding" role="editor">
61    <organization abbrev="Day Software">Day Software</organization>
62    <address>
63      <postal>
64        <street>23 Corporate Plaza DR, Suite 280</street>
65        <city>Newport Beach</city>
66        <region>CA</region>
67        <code>92660</code>
68        <country>USA</country>
69      </postal>
70      <phone>+1-949-706-5300</phone>
71      <facsimile>+1-949-706-5305</facsimile>
72      <email>fielding@gbiv.com</email>
73      <uri>http://roy.gbiv.com/</uri>
74    </address>
75  </author>
76
77  <author initials="J." surname="Gettys" fullname="Jim Gettys">
78    <organization>One Laptop per Child</organization>
79    <address>
80      <postal>
81        <street>21 Oak Knoll Road</street>
82        <city>Carlisle</city>
83        <region>MA</region>
84        <code>01741</code>
85        <country>USA</country>
86      </postal>
87      <email>jg@laptop.org</email>
88      <uri>http://www.laptop.org/</uri>
89    </address>
90  </author>
91 
92  <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
93    <organization abbrev="HP">Hewlett-Packard Company</organization>
94    <address>
95      <postal>
96        <street>HP Labs, Large Scale Systems Group</street>
97        <street>1501 Page Mill Road, MS 1177</street>
98        <city>Palo Alto</city>
99        <region>CA</region>
100        <code>94304</code>
101        <country>USA</country>
102      </postal>
103      <email>JeffMogul@acm.org</email>
104    </address>
105  </author>
106
107  <author initials="H." surname="Frystyk" fullname="Henrik Frystyk Nielsen">
108    <organization abbrev="Microsoft">Microsoft Corporation</organization>
109    <address>
110      <postal>
111        <street>1 Microsoft Way</street>
112        <city>Redmond</city>
113        <region>WA</region>
114        <code>98052</code>
115        <country>USA</country>
116      </postal>
117      <email>henrikn@microsoft.com</email>
118    </address>
119  </author>
120
121  <author initials="L." surname="Masinter" fullname="Larry Masinter">
122    <organization abbrev="Adobe Systems">Adobe Systems, Incorporated</organization>
123    <address>
124      <postal>
125        <street>345 Park Ave</street>
126        <city>San Jose</city>
127        <region>CA</region>
128        <code>95110</code>
129        <country>USA</country>
130      </postal>
131      <email>LMM@acm.org</email>
132      <uri>http://larry.masinter.net/</uri>
133    </address>
134  </author>
135 
136  <author initials="P." surname="Leach" fullname="Paul J. Leach">
137    <organization abbrev="Microsoft">Microsoft Corporation</organization>
138    <address>
139      <postal>
140        <street>1 Microsoft Way</street>
141        <city>Redmond</city>
142        <region>WA</region>
143        <code>98052</code>
144      </postal>
145      <email>paulle@microsoft.com</email>
146    </address>
147  </author>
148   
149  <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
150    <organization abbrev="W3C/MIT">World Wide Web Consortium</organization>
151    <address>
152      <postal>
153        <street>MIT Computer Science and Artificial Intelligence Laboratory</street>
154        <street>The Stata Center, Building 32</street>
155        <street>32 Vassar Street</street>
156        <city>Cambridge</city>
157        <region>MA</region>
158        <code>02139</code>
159        <country>USA</country>
160      </postal>
161      <email>timbl@w3.org</email>
162      <uri>http://www.w3.org/People/Berners-Lee/</uri>
163    </address>
164  </author>
165
166  <author initials="Y." surname="Lafon" fullname="Yves Lafon" role="editor">
167    <organization abbrev="W3C">World Wide Web Consortium</organization>
168    <address>
169      <postal>
170        <street>W3C / ERCIM</street>
171        <street>2004, rte des Lucioles</street>
172        <city>Sophia-Antipolis</city>
173        <region>AM</region>
174        <code>06902</code>
175        <country>France</country>
176      </postal>
177      <email>ylafon@w3.org</email>
178      <uri>http://www.raubacapeu.net/people/yves/</uri>
179    </address>
180  </author>
181
182  <author initials="J. F." surname="Reschke" fullname="Julian F. Reschke" role="editor">
183    <organization abbrev="greenbytes">greenbytes GmbH</organization>
184    <address>
185      <postal>
186        <street>Hafenweg 16</street>
187        <city>Muenster</city><region>NW</region><code>48155</code>
188        <country>Germany</country>
189      </postal>
190      <phone>+49 251 2807760</phone>   
191      <facsimile>+49 251 2807761</facsimile>   
192      <email>julian.reschke@greenbytes.de</email>       
193      <uri>http://greenbytes.de/tech/webdav/</uri>     
194    </address>
195  </author>
196
197  <date month="&ID-MONTH;" year="&ID-YEAR;"/>
198
199<abstract>
200<t>
201   The Hypertext Transfer Protocol (HTTP) is an application-level
202   protocol for distributed, collaborative, hypermedia information
203   systems. HTTP has been in use by the World Wide Web global information
204   initiative since 1990. This document is Part 1 of the seven-part specification
205   that defines the protocol referred to as "HTTP/1.1" and, taken together,
206   obsoletes RFC 2616.  Part 1 provides an overview of HTTP and
207   its associated terminology, defines the "http" and "https" Uniform
208   Resource Identifier (URI) schemes, defines the generic message syntax
209   and parsing requirements for HTTP message frames, and describes
210   general security concerns for implementations.
211</t>
212</abstract>
213
214<note title="Editorial Note (To be removed by RFC Editor)">
215  <t>
216    Discussion of this draft should take place on the HTTPBIS working group
217    mailing list (ietf-http-wg@w3.org). The current issues list is
218    at <eref target="http://www.tools.ietf.org/wg/httpbis/trac/report/11"/>
219    and related documents (including fancy diffs) can be found at
220    <eref target="http://www.tools.ietf.org/wg/httpbis/"/>.
221  </t>
222  <t>
223    The changes in this draft are summarized in <xref target="changes.since.02"/>.
224  </t>
225</note>
226</front>
227<middle>
228<section title="Introduction" anchor="introduction">
229<t>
230   The Hypertext Transfer Protocol (HTTP) is an application-level
231   protocol for distributed, collaborative, hypermedia information
232   systems. HTTP has been in use by the World-Wide Web global
233   information initiative since 1990. The first version of HTTP, commonly
234   referred to as HTTP/0.9, was a simple protocol for raw data transfer
235   across the Internet with only a single method and no metadata.
236   HTTP/1.0, as defined by <xref target="RFC1945"/>, improved
237   the protocol by allowing messages to be in the format of MIME-like
238   messages, containing metadata about the data transferred and
239   modifiers on the request/response semantics. However, HTTP/1.0 did
240   not sufficiently take into consideration the effects of hierarchical
241   proxies, caching, the need for persistent connections, or name-based
242   virtual hosts. In addition, the proliferation of incompletely-implemented
243   applications calling themselves "HTTP/1.0" necessitated a
244   protocol version change in order for two communicating applications
245   to determine each other's true capabilities.
246</t>
247<t>
248   This document is Part 1 of the seven-part specification that defines
249   the protocol referred to as "HTTP/1.1", obsoleting <xref target="RFC2616"/>.
250   HTTP/1.1 remains compatible with HTTP/1.0 by including more stringent
251   requirements that enable reliable implementations and adding only
252   those new features that will either be safely ignored by an HTTP/1.0
253   recipient or only sent when communicating with a party advertising
254   compliance with HTTP/1.1.
255   Part 1 defines those aspects of HTTP/1.1 related to overall network
256   operation, message framing, interaction with transport protocols, and
257   URI schemes.
258</t>
259<t>
260   This document is currently disorganized in order to minimize the changes
261   between drafts and enable reviewers to see the smaller errata changes.
262   The next draft will reorganize the sections to better reflect the content.
263   In particular, the sections will be organized according to the typical
264   process of deciding when to use HTTP (URI schemes), overall network operation,
265   connection management, message framing, and generic message parsing.
266   The current mess reflects how widely dispersed these topics and associated
267   requirements had become in <xref target="RFC2616"/>.
268</t>
269
270<section title="Purpose" anchor="intro.purpose">
271<t>
272   Practical information systems require more functionality than simple
273   retrieval, including search, front-end update, and annotation. HTTP
274   allows an open-ended set of methods and headers that indicate the
275   purpose of a request <xref target="RFC2324"/>. It builds on the discipline of reference
276   provided by the Uniform Resource Identifier (URI) <xref target="RFC1630"/>, as a location
277   (URL) <xref target="RFC1738"/> or name (URN) <xref target="RFC1737"/>, for indicating the resource to which a
278   method is to be applied. Messages are passed in a format similar to
279   that used by Internet mail <xref target="RFC2822"/> as defined by the Multipurpose
280   Internet Mail Extensions (MIME) <xref target="RFC2045"/>.
281</t>
282<t>
283   HTTP is also used as a generic protocol for communication between
284   user agents and proxies/gateways to other Internet systems, including
285   those supported by the SMTP <xref target="RFC2821"/>, NNTP <xref target="RFC3977"/>, FTP <xref target="RFC959"/>, Gopher <xref target="RFC1436"/>,
286   and WAIS <xref target="WAIS"/> protocols. In this way, HTTP allows basic hypermedia
287   access to resources available from diverse applications.
288</t>
289</section>
290
291<section title="Requirements" anchor="intro.requirements">
292<t>
293   The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT",
294   "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this
295   document are to be interpreted as described in <xref target="RFC2119"/>.
296</t>
297<t>
298   An implementation is not compliant if it fails to satisfy one or more
299   of the &MUST; or &REQUIRED; level requirements for the protocols it
300   implements. An implementation that satisfies all the &MUST; or &REQUIRED;
301   level and all the &SHOULD; level requirements for its protocols is said
302   to be "unconditionally compliant"; one that satisfies all the &MUST;
303   level requirements but not all the &SHOULD; level requirements for its
304   protocols is said to be "conditionally compliant."
305</t>
306</section>
307
308<section title="Terminology" anchor="intro.terminology">
309<t>
310   This specification uses a number of terms to refer to the roles
311   played by participants in, and objects of, the HTTP communication.
312</t>
313<t>
314  <iref item="connection"/>
315  <x:dfn>connection</x:dfn>
316  <list>
317    <t>
318      A transport layer virtual circuit established between two programs
319      for the purpose of communication.
320    </t>
321  </list>
322</t>
323<t>
324  <iref item="message"/>
325  <x:dfn>message</x:dfn>
326  <list>
327    <t>
328      The basic unit of HTTP communication, consisting of a structured
329      sequence of octets matching the syntax defined in <xref target="http.message"/> and
330      transmitted via the connection.
331    </t>
332  </list>
333</t>
334<t>
335  <iref item="request"/>
336  <x:dfn>request</x:dfn>
337  <list>
338    <t>
339      An HTTP request message, as defined in <xref target="request"/>.
340    </t>
341  </list>
342</t>
343<t>
344  <iref item="response"/>
345  <x:dfn>response</x:dfn>
346  <list>
347    <t>
348      An HTTP response message, as defined in <xref target="response"/>.
349    </t>
350  </list>
351</t>
352<t>
353  <iref item="resource"/>
354  <x:dfn>resource</x:dfn>
355  <list>
356    <t>
357      A network data object or service that can be identified by a URI,
358      as defined in <xref target="uri"/>. Resources may be available in multiple
359      representations (e.g. multiple languages, data formats, size, and
360      resolutions) or vary in other ways.
361    </t>
362  </list>
363</t>
364<t>
365  <iref item="entity"/>
366  <x:dfn>entity</x:dfn>
367  <list>
368    <t>
369      The information transferred as the payload of a request or
370      response. An entity consists of metainformation in the form of
371      entity-header fields and content in the form of an entity-body, as
372      described in &entity;.
373    </t>
374  </list>
375</t>
376<t>
377  <iref item="representation"/>
378  <x:dfn>representation</x:dfn>
379  <list>
380    <t>
381      An entity included with a response that is subject to content
382      negotiation, as described in &content.negotiation;. There may exist multiple
383      representations associated with a particular response status.
384    </t>
385  </list>
386</t>
387<t>
388  <iref item="content negotiation"/>
389  <x:dfn>content negotiation</x:dfn>
390  <list>
391    <t>
392      The mechanism for selecting the appropriate representation when
393      servicing a request, as described in &content.negotiation;. The
394      representation of entities in any response can be negotiated
395      (including error responses).
396    </t>
397  </list>
398</t>
399<t>
400  <iref item="variant"/>
401  <x:dfn>variant</x:dfn>
402  <list>
403    <t>
404      A resource may have one, or more than one, representation(s)
405      associated with it at any given instant. Each of these
406      representations is termed a `variant'.  Use of the term `variant'
407      does not necessarily imply that the resource is subject to content
408      negotiation.
409    </t>
410  </list>
411</t>
412<t>
413  <iref item="client"/>
414  <x:dfn>client</x:dfn>
415  <list>
416    <t>
417      A program that establishes connections for the purpose of sending
418      requests.
419    </t>
420  </list>
421</t>
422<t>
423  <iref item="user agent"/>
424  <x:dfn>user agent</x:dfn>
425  <list>
426    <t>
427      The client which initiates a request. These are often browsers,
428      editors, spiders (web-traversing robots), or other end user tools.
429    </t>
430  </list>
431</t>
432<t>
433  <iref item="server"/>
434  <x:dfn>server</x:dfn>
435  <list>
436    <t>
437      An application program that accepts connections in order to
438      service requests by sending back responses. Any given program may
439      be capable of being both a client and a server; our use of these
440      terms refers only to the role being performed by the program for a
441      particular connection, rather than to the program's capabilities
442      in general. Likewise, any server may act as an origin server,
443      proxy, gateway, or tunnel, switching behavior based on the nature
444      of each request.
445    </t>
446  </list>
447</t>
448<t>
449  <iref item="origin server"/>
450  <x:dfn>origin server</x:dfn>
451  <list>
452    <t>
453      The server on which a given resource resides or is to be created.
454    </t>
455  </list>
456</t>
457<t>
458  <iref item="proxy"/>
459  <x:dfn>proxy</x:dfn>
460  <list>
461    <t>
462      An intermediary program which acts as both a server and a client
463      for the purpose of making requests on behalf of other clients.
464      Requests are serviced internally or by passing them on, with
465      possible translation, to other servers. A proxy &MUST; implement
466      both the client and server requirements of this specification. A
467      "transparent proxy" is a proxy that does not modify the request or
468      response beyond what is required for proxy authentication and
469      identification. A "non-transparent proxy" is a proxy that modifies
470      the request or response in order to provide some added service to
471      the user agent, such as group annotation services, media type
472      transformation, protocol reduction, or anonymity filtering. Except
473      where either transparent or non-transparent behavior is explicitly
474      stated, the HTTP proxy requirements apply to both types of
475      proxies.
476    </t>
477  </list>
478</t>
479<t>
480  <iref item="gateway"/>
481  <x:dfn>gateway</x:dfn>
482  <list>
483    <t>
484      A server which acts as an intermediary for some other server.
485      Unlike a proxy, a gateway receives requests as if it were the
486      origin server for the requested resource; the requesting client
487      may not be aware that it is communicating with a gateway.
488    </t>
489  </list>
490</t>
491<t>
492  <iref item="tunnel"/>
493  <x:dfn>tunnel</x:dfn>
494  <list>
495    <t>
496      An intermediary program which is acting as a blind relay between
497      two connections. Once active, a tunnel is not considered a party
498      to the HTTP communication, though the tunnel may have been
499      initiated by an HTTP request. The tunnel ceases to exist when both
500      ends of the relayed connections are closed.
501    </t>
502  </list>
503</t>
504<t>
505  <iref item="cache"/>
506  <x:dfn>cache</x:dfn>
507  <list>
508    <t>
509      A program's local store of response messages and the subsystem
510      that controls its message storage, retrieval, and deletion. A
511      cache stores cacheable responses in order to reduce the response
512      time and network bandwidth consumption on future, equivalent
513      requests. Any client or server may include a cache, though a cache
514      cannot be used by a server that is acting as a tunnel.
515    </t>
516  </list>
517</t>
518<t>
519  <iref item="cacheable"/>
520  <x:dfn>cacheable</x:dfn>
521  <list>
522    <t>
523      A response is cacheable if a cache is allowed to store a copy of
524      the response message for use in answering subsequent requests. The
525      rules for determining the cacheability of HTTP responses are
526      defined in &caching;. Even if a resource is cacheable, there may
527      be additional constraints on whether a cache can use the cached
528      copy for a particular request.
529    </t>
530  </list>
531</t>
532<t>
533  <iref item="upstream"/>
534  <iref item="downstream"/>
535  <x:dfn>upstream</x:dfn>/<x:dfn>downstream</x:dfn>
536  <list>
537    <t>
538      Upstream and downstream describe the flow of a message: all
539      messages flow from upstream to downstream.
540    </t>
541  </list>
542</t>
543<t>
544  <iref item="inbound"/>
545  <iref item="outbound"/>
546  <x:dfn>inbound</x:dfn>/<x:dfn>outbound</x:dfn>
547  <list>
548    <t>
549      Inbound and outbound refer to the request and response paths for
550      messages: "inbound" means "traveling toward the origin server",
551      and "outbound" means "traveling toward the user agent"
552    </t>
553  </list>
554</t>
555</section>
556
557<section title="Overall Operation" anchor="intro.overall.operation">
558<t>
559   HTTP is a request/response protocol. A client sends a
560   request to the server in the form of a request method, URI, and
561   protocol version, followed by a MIME-like message containing request
562   modifiers, client information, and possible body content over a
563   connection with a server. The server responds with a status line,
564   including the message's protocol version and a success or error code,
565   followed by a MIME-like message containing server information, entity
566   metainformation, and possible entity-body content. The relationship
567   between HTTP and MIME is described in &diff2045entity;.
568</t>
569<t>
570   Most HTTP communication is initiated by a user agent and consists of
571   a request to be applied to a resource on some origin server. In the
572   simplest case, this may be accomplished via a single connection (v)
573   between the user agent (UA) and the origin server (O).
574</t>
575<figure><artwork type="drawing">
576       request chain ------------------------&gt;
577    UA -------------------v------------------- O
578       &lt;----------------------- response chain
579</artwork></figure>
580<t>
581   A more complicated situation occurs when one or more intermediaries
582   are present in the request/response chain. There are three common
583   forms of intermediary: proxy, gateway, and tunnel. A proxy is a
584   forwarding agent, receiving requests for a URI in its absolute form,
585   rewriting all or part of the message, and forwarding the reformatted
586   request toward the server identified by the URI. A gateway is a
587   receiving agent, acting as a layer above some other server(s) and, if
588   necessary, translating the requests to the underlying server's
589   protocol. A tunnel acts as a relay point between two connections
590   without changing the messages; tunnels are used when the
591   communication needs to pass through an intermediary (such as a
592   firewall) even when the intermediary cannot understand the contents
593   of the messages.
594</t>
595<figure><artwork type="drawing">
596       request chain --------------------------------------&gt;
597    UA -----v----- A -----v----- B -----v----- C -----v----- O
598       &lt;------------------------------------- response chain
599</artwork></figure>
600<t>
601   The figure above shows three intermediaries (A, B, and C) between the
602   user agent and origin server. A request or response message that
603   travels the whole chain will pass through four separate connections.
604   This distinction is important because some HTTP communication options
605   may apply only to the connection with the nearest, non-tunnel
606   neighbor, only to the end-points of the chain, or to all connections
607   along the chain. Although the diagram is linear, each participant may
608   be engaged in multiple, simultaneous communications. For example, B
609   may be receiving requests from many clients other than A, and/or
610   forwarding requests to servers other than C, at the same time that it
611   is handling A's request.
612</t>
613<t>
614   Any party to the communication which is not acting as a tunnel may
615   employ an internal cache for handling requests. The effect of a cache
616   is that the request/response chain is shortened if one of the
617   participants along the chain has a cached response applicable to that
618   request. The following illustrates the resulting chain if B has a
619   cached copy of an earlier response from O (via C) for a request which
620   has not been cached by UA or A.
621</t>
622<figure><artwork type="drawing">
623          request chain ----------&gt;
624       UA -----v----- A -----v----- B - - - - - - C - - - - - - O
625          &lt;--------- response chain
626</artwork></figure>
627<t>
628   Not all responses are usefully cacheable, and some requests may
629   contain modifiers which place special requirements on cache behavior.
630   HTTP requirements for cache behavior and cacheable responses are
631   defined in &caching;.
632</t>
633<t>
634   In fact, there are a wide variety of architectures and configurations
635   of caches and proxies currently being experimented with or deployed
636   across the World Wide Web. These systems include national hierarchies
637   of proxy caches to save transoceanic bandwidth, systems that
638   broadcast or multicast cache entries, organizations that distribute
639   subsets of cached data via CD-ROM, and so on. HTTP systems are used
640   in corporate intranets over high-bandwidth links, and for access via
641   PDAs with low-power radio links and intermittent connectivity. The
642   goal of HTTP/1.1 is to support the wide diversity of configurations
643   already deployed while introducing protocol constructs that meet the
644   needs of those who build web applications that require high
645   reliability and, failing that, at least reliable indications of
646   failure.
647</t>
648<t>
649   HTTP communication usually takes place over TCP/IP connections. The
650   default port is TCP 80 (<eref target="http://www.iana.org/assignments/port-numbers"/>), but other ports can be used. This does
651   not preclude HTTP from being implemented on top of any other protocol
652   on the Internet, or on other networks. HTTP only presumes a reliable
653   transport; any protocol that provides such guarantees can be used;
654   the mapping of the HTTP/1.1 request and response structures onto the
655   transport data units of the protocol in question is outside the scope
656   of this specification.
657</t>
658<t>
659   In HTTP/1.0, most implementations used a new connection for each
660   request/response exchange. In HTTP/1.1, a connection may be used for
661   one or more request/response exchanges, although connections may be
662   closed for a variety of reasons (see <xref target="persistent.connections"/>).
663</t>
664</section>
665</section>
666
667<section title="Notational Conventions and Generic Grammar" anchor="notation">
668
669<section title="Augmented BNF" anchor="notation.abnf">
670<t>
671   All of the mechanisms specified in this document are described in
672   both prose and an augmented Backus-Naur Form (BNF) similar to that
673   used by <xref target="RFC822ABNF"/>. Implementors will need to be familiar with the
674   notation in order to understand this specification. The augmented BNF
675   includes the following constructs:
676</t>
677<t>
678   name = definition
679  <list>
680    <t>
681      The name of a rule is simply the name itself (without any
682      enclosing "&lt;" and "&gt;") and is separated from its definition by the
683      equal "=" character. White space is only significant in that
684      indentation of continuation lines is used to indicate a rule
685      definition that spans more than one line. Certain basic rules are
686      in uppercase, such as SP, LWS, HTAB, CRLF, DIGIT, ALPHA, etc. Angle
687      brackets are used within definitions whenever their presence will
688      facilitate discerning the use of rule names.
689    </t>
690  </list>
691</t>
692<t>
693   "literal"
694  <list>
695    <t>
696      Quotation marks surround literal text. Unless stated otherwise,
697      the text is case-insensitive.
698    </t>
699  </list>
700</t>
701<t>
702   rule1 | rule2
703  <list>
704    <t>
705      Elements separated by a bar ("|") are alternatives, e.g., "yes |
706      no" will accept yes or no.
707    </t>
708  </list>
709</t>
710<t>
711   (rule1 rule2)
712  <list>
713    <t>
714      Elements enclosed in parentheses are treated as a single element.
715      Thus, "(elem (foo | bar) elem)" allows the token sequences "elem
716      foo elem" and "elem bar elem".
717    </t>
718  </list>
719</t>
720<t>
721   *rule
722  <list>
723    <t>
724      The character "*" preceding an element indicates repetition. The
725      full form is "&lt;n&gt;*&lt;m&gt;element" indicating at least &lt;n&gt; and at most
726      &lt;m&gt; occurrences of element. Default values are 0 and infinity so
727      that "*(element)" allows any number, including zero; "1*element"
728      requires at least one; and "1*2element" allows one or two.
729    </t>
730  </list>
731</t>
732<t>
733   [rule]
734  <list>
735    <t>
736      Square brackets enclose optional elements; "[foo bar]" is
737      equivalent to "*1(foo bar)".
738    </t>
739  </list>
740</t>
741<t>
742   N rule
743  <list>
744    <t>
745      Specific repetition: "&lt;n&gt;(element)" is equivalent to
746      "&lt;n&gt;*&lt;n&gt;(element)"; that is, exactly &lt;n&gt; occurrences of (element).
747      Thus 2DIGIT is a 2-digit number, and 3ALPHA is a string of three
748      alphabetic characters.
749    </t>
750  </list>
751</t>
752<t>
753   #rule
754  <list>
755    <t>
756      A construct "#" is defined, similar to "*", for defining lists of
757      elements. The full form is "&lt;n&gt;#&lt;m&gt;element" indicating at least
758      &lt;n&gt; and at most &lt;m&gt; elements, each separated by one or more commas
759      (",") and &OPTIONAL; linear white space (LWS). This makes the usual
760      form of lists very easy; a rule such as
761      <figure><artwork type="example">
762   ( *<x:ref>LWS</x:ref> element *( *<x:ref>LWS</x:ref> "," *<x:ref>LWS</x:ref> element ))</artwork></figure>
763    </t>
764    <t>
765      can be shown as
766      <figure><artwork type="example">
767   1#element</artwork></figure>
768    </t>
769    <t>
770      Wherever this construct is used, null elements are allowed, but do
771      not contribute to the count of elements present. That is,
772      "(element), , (element) " is permitted, but counts as only two
773      elements. Therefore, where at least one element is required, at
774      least one non-null element &MUST; be present. Default values are 0
775      and infinity so that "#element" allows any number, including zero;
776      "1#element" requires at least one; and "1#2element" allows one or
777      two.
778    </t>
779  </list>
780</t>
781<t>
782   ; comment
783  <list>
784    <t>
785      A semi-colon, set off some distance to the right of rule text,
786      starts a comment that continues to the end of line. This is a
787      simple way of including useful notes in parallel with the
788      specifications.
789    </t>
790  </list>
791</t>
792<t anchor="implied.LWS">
793  <iref item="implied *LWS" primary="true"/>
794   implied *LWS
795  <list>
796    <t>
797      The grammar described by this specification is word-based. Except
798      where noted otherwise, linear white space (LWS) can be included
799      between any two adjacent words (token or quoted-string), and
800      between adjacent words and separators, without changing the
801      interpretation of a field. At least one delimiter (LWS and/or
802      separators) &MUST; exist between any two tokens (for the definition
803      of "token" below), since they would otherwise be interpreted as a
804      single token.
805    </t>
806  </list>
807</t>
808</section>
809
810<section title="Basic Rules" anchor="basic.rules">
811<t anchor="core.rules">
812  <x:anchor-alias value="OCTET"/>
813  <x:anchor-alias value="CHAR"/>
814  <x:anchor-alias value="ALPHA"/>
815  <x:anchor-alias value="DIGIT"/>
816  <x:anchor-alias value="CTL"/>
817  <x:anchor-alias value="CR"/>
818  <x:anchor-alias value="LF"/>
819  <x:anchor-alias value="SP"/>
820  <x:anchor-alias value="HTAB"/>
821  <x:anchor-alias value="DQUOTE"/>
822   The following rules are used throughout this specification to
823   describe basic parsing constructs. The US-ASCII coded character set
824   is defined by ANSI X3.4-1986 <xref target="USASCII"/>.
825</t>
826<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="OCTET"/><iref primary="true" item="Grammar" subitem="CHAR"/><iref primary="true" item="Grammar" subitem="ALPHA"/><iref primary="true" item="Grammar" subitem="DIGIT"/><iref primary="true" item="Grammar" subitem="CTL"/><iref primary="true" item="Grammar" subitem="CR"/><iref primary="true" item="Grammar" subitem="LF"/><iref primary="true" item="Grammar" subitem="SP"/><iref primary="true" item="Grammar" subitem="HTAB"/><iref primary="true" item="Grammar" subitem="DQUOTE"/>
827  <x:ref>OCTET</x:ref>          = %x00-FF
828                   ; any 8-bit sequence of data
829  <x:ref>CHAR</x:ref>           = %x01-7F
830                   ; any US-ASCII character, excluding NUL
831  <x:ref>ALPHA</x:ref>          = %x41-5A | %x61-7A
832                   ; A-Z | a-z
833  <x:ref>DIGIT</x:ref>          = %x30-39
834                   ; any US-ASCII digit "0".."9"
835  <x:ref>CTL</x:ref>            = %x00-1F | %x7F
836                   ; (octets 0 - 31) and DEL (127)
837  <x:ref>CR</x:ref>             = %x0D
838                   ; US-ASCII CR, carriage return (13)
839  <x:ref>LF</x:ref>             = %x0A
840                   ; US-ASCII LF, linefeed (10)
841  <x:ref>SP</x:ref>             = %x20
842                   ; US-ASCII SP, space (32)
843  <x:ref>HTAB</x:ref>           = %x09
844                   ; US-ASCII HT, horizontal-tab (9)
845  <x:ref>DQUOTE</x:ref>         = %x22
846                   ; US-ASCII double-quote mark (34)
847</artwork></figure>
848<t anchor="rule.CRLF">
849  <x:anchor-alias value="CRLF"/>
850   HTTP/1.1 defines the sequence CR LF as the end-of-line marker for all
851   protocol elements except the entity-body (see <xref target="tolerant.applications"/> for
852   tolerant applications). The end-of-line marker within an entity-body
853   is defined by its associated media type, as described in &media-types;.
854</t>
855<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="CRLF"/>
856  <x:ref>CRLF</x:ref>           = <x:ref>CR</x:ref> LF
857</artwork></figure>
858<t anchor="rule.LWS">
859  <x:anchor-alias value="LWS"/>
860   HTTP/1.1 header field values can be folded onto multiple lines if the
861   continuation line begins with a space or horizontal tab. All linear
862   white space, including folding, has the same semantics as SP. A
863   recipient &MAY; replace any linear white space with a single SP before
864   interpreting the field value or forwarding the message downstream.
865</t>
866<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="LWS"/>
867  <x:ref>LWS</x:ref>            = [<x:ref>CRLF</x:ref>] 1*( <x:ref>SP</x:ref> | <x:ref>HTAB</x:ref> )
868</artwork></figure>
869<t anchor="rule.TEXT">
870  <x:anchor-alias value="TEXT"/>
871   The TEXT rule is only used for descriptive field contents and values
872   that are not intended to be interpreted by the message parser. Words
873   of *TEXT &MAY; contain characters from character sets other than ISO-8859-1
874   <xref target="ISO-8859-1"/> only when encoded according to the rules of
875   <xref target="RFC2047"/>.
876</t>
877<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="TEXT"/>
878  <x:ref>TEXT</x:ref>           = %x20-7E | %x80-FF | <x:ref>LWS</x:ref>
879                 ; any <x:ref>OCTET</x:ref> except <x:ref>CTL</x:ref>s, but including <x:ref>LWS</x:ref>
880</artwork></figure>
881<t>
882   A CRLF is allowed in the definition of TEXT only as part of a header
883   field continuation. It is expected that the folding LWS will be
884   replaced with a single SP before interpretation of the TEXT value.
885</t>
886<t anchor="rule.HEX">
887  <x:anchor-alias value="HEX"/>
888   Hexadecimal numeric characters are used in several protocol elements.
889</t>
890<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="HEX"/>
891  <x:ref>HEX</x:ref>            = "A" | "B" | "C" | "D" | "E" | "F"
892                 | "a" | "b" | "c" | "d" | "e" | "f" | <x:ref>DIGIT</x:ref>
893</artwork></figure>
894<t anchor="rule.token.separators">
895  <x:anchor-alias value="tchar"/>
896  <x:anchor-alias value="token"/>
897  <x:anchor-alias value="separators"/>
898   Many HTTP/1.1 header field values consist of words separated by LWS
899   or special characters. These special characters &MUST; be in a quoted
900   string to be used within a parameter value (as defined in
901   <xref target="transfer.codings"/>).
902</t>
903<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="token"/><iref primary="true" item="Grammar" subitem="tchar"/><iref primary="true" item="Grammar" subitem="separators"/>
904  <x:ref>separators</x:ref>     = "(" | ")" | "&lt;" | "&gt;" | "@"
905                 | "," | ";" | ":" | "\" | <x:ref>DQUOTE</x:ref>
906                 | "/" | "[" | "]" | "?" | "="
907                 | "{" | "}" | <x:ref>SP</x:ref> | <x:ref>HTAB</x:ref>
908                 
909  <x:ref>tchar</x:ref>          = "!" | "#" | "$" | "%" | "&amp;" | "'" | "*"
910                 | "+" | "-" | "." | "^" | "_" | "`" | "|" | "~"
911                 | <x:ref>DIGIT</x:ref> | <x:ref>ALPHA</x:ref>
912                 ; any <x:ref>CHAR</x:ref> except <x:ref>CTL</x:ref>s or <x:ref>separators</x:ref>
913                 
914  <x:ref>token</x:ref>          = 1*<x:ref>tchar</x:ref>
915</artwork></figure>
916<t anchor="rule.comment">
917  <x:anchor-alias value="comment"/>
918  <x:anchor-alias value="ctext"/>
919   Comments can be included in some HTTP header fields by surrounding
920   the comment text with parentheses. Comments are only allowed in
921   fields containing "comment" as part of their field value definition.
922   In all other fields, parentheses are considered part of the field
923   value.
924</t>
925<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="comment"/><iref primary="true" item="Grammar" subitem="ctext"/>
926  <x:ref>comment</x:ref>        = "(" *( <x:ref>ctext</x:ref> | <x:ref>quoted-pair</x:ref> | <x:ref>comment</x:ref> ) ")"
927  <x:ref>ctext</x:ref>          = &lt;any <x:ref>TEXT</x:ref> excluding "(" and ")"&gt;
928</artwork></figure>
929<t anchor="rule.quoted-string">
930  <x:anchor-alias value="quoted-string"/>
931  <x:anchor-alias value="qdtext"/>
932   A string of text is parsed as a single word if it is quoted using
933   double-quote marks.
934</t>
935<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="quoted-string"/><iref primary="true" item="Grammar" subitem="qdtext"/>
936  <x:ref>quoted-string</x:ref>  = ( <x:ref>DQUOTE</x:ref> *(<x:ref>qdtext</x:ref> | <x:ref>quoted-pair</x:ref> ) <x:ref>DQUOTE</x:ref> )
937  <x:ref>qdtext</x:ref>         = &lt;any <x:ref>TEXT</x:ref> excluding <x:ref>DQUOTE</x:ref> and "\">
938</artwork></figure>
939<t anchor="rule.quoted-pair">
940  <x:anchor-alias value="quoted-pair"/>
941  <x:anchor-alias value="quoted-text"/>
942   The backslash character ("\") &MAY; be used as a single-character
943   quoting mechanism only within quoted-string and comment constructs.
944</t>
945<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="quoted-text"/><iref primary="true" item="Grammar" subitem="quoted-pair"/>
946  <x:ref>quoted-text</x:ref>    = %x01-09 |
947                   %x0B-0C |
948                   %x0E-FF ; Characters excluding NUL, <x:ref>CR</x:ref> and <x:ref>LF</x:ref>
949  <x:ref>quoted-pair</x:ref>    = "\" <x:ref>quoted-text</x:ref>
950</artwork></figure>
951</section>
952
953<section title="ABNF Rules defined in other Parts of the Specification" anchor="abnf.dependencies">
954  <x:anchor-alias value="request-header"/>
955  <x:anchor-alias value="response-header"/>
956  <x:anchor-alias value="accept-params"/>
957  <x:anchor-alias value="entity-body"/>
958  <x:anchor-alias value="entity-header"/>
959  <x:anchor-alias value="Cache-Control"/>
960  <x:anchor-alias value="Pragma"/>
961  <x:anchor-alias value="Warning"/>
962<t>
963  The ABNF rules below are defined in other parts:
964</t>
965<figure><!-- Part2--><artwork type="abnf2616">
966  <x:ref>request-header</x:ref>  = &lt;request-header, defined in &request-header-fields;&gt;
967  <x:ref>response-header</x:ref> = &lt;response-header, defined in &response-header-fields;&gt;
968</artwork></figure>
969<figure><!-- Part3--><artwork type="abnf2616">
970  <x:ref>accept-params</x:ref>   = &lt;accept-params, defined in &header-accept;&gt;
971  <x:ref>entity-body</x:ref>     = &lt;entity-body, defined in &entity-body;&gt;
972  <x:ref>entity-header</x:ref>   = &lt;entity-header, defined in &entity-header-fields;&gt;
973</artwork></figure>
974<figure><!-- Part6--><artwork type="abnf2616">
975  <x:ref>Cache-Control</x:ref>   = &lt;Cache-Control, defined in &header-pragma;&gt;
976  <x:ref>Pragma</x:ref>          = &lt;Pragma, defined in &header-pragma;&gt;
977  <x:ref>Warning</x:ref>         = &lt;Warning, defined in &header-warning;&gt;
978</artwork></figure>
979</section>
980
981</section>
982
983<section title="Protocol Parameters" anchor="protocol.parameters">
984
985<section title="HTTP Version" anchor="http.version">
986  <x:anchor-alias value="HTTP-Version"/>
987  <x:anchor-alias value="HTTP-Prot-Name"/>
988<t>
989   HTTP uses a "&lt;major&gt;.&lt;minor&gt;" numbering scheme to indicate versions
990   of the protocol. The protocol versioning policy is intended to allow
991   the sender to indicate the format of a message and its capacity for
992   understanding further HTTP communication, rather than the features
993   obtained via that communication. No change is made to the version
994   number for the addition of message components which do not affect
995   communication behavior or which only add to extensible field values.
996   The &lt;minor&gt; number is incremented when the changes made to the
997   protocol add features which do not change the general message parsing
998   algorithm, but which may add to the message semantics and imply
999   additional capabilities of the sender. The &lt;major&gt; number is
1000   incremented when the format of a message within the protocol is
1001   changed. See <xref target="RFC2145"/> for a fuller explanation.
1002</t>
1003<t>
1004   The version of an HTTP message is indicated by an HTTP-Version field
1005   in the first line of the message. HTTP-Version is case-sensitive.
1006</t>
1007<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="HTTP-Version"/><iref primary="true" item="Grammar" subitem="HTTP-Prot-Name"/>
1008  <x:ref>HTTP-Version</x:ref>   = <x:ref>HTTP-Prot-Name</x:ref> "/" 1*<x:ref>DIGIT</x:ref> "." 1*<x:ref>DIGIT</x:ref>
1009  <x:ref>HTTP-Prot-Name</x:ref> = <x:abnf-char-sequence>"HTTP"</x:abnf-char-sequence> ; "HTTP", case-sensitive
1010</artwork></figure>
1011<t>
1012   Note that the major and minor numbers &MUST; be treated as separate
1013   integers and that each &MAY; be incremented higher than a single digit.
1014   Thus, HTTP/2.4 is a lower version than HTTP/2.13, which in turn is
1015   lower than HTTP/12.3. Leading zeros &MUST; be ignored by recipients and
1016   &MUST-NOT; be sent.
1017</t>
1018<t>
1019   An application that sends a request or response message that includes
1020   HTTP-Version of "HTTP/1.1" &MUST; be at least conditionally compliant
1021   with this specification. Applications that are at least conditionally
1022   compliant with this specification &SHOULD; use an HTTP-Version of
1023   "HTTP/1.1" in their messages, and &MUST; do so for any message that is
1024   not compatible with HTTP/1.0. For more details on when to send
1025   specific HTTP-Version values, see <xref target="RFC2145"/>.
1026</t>
1027<t>
1028   The HTTP version of an application is the highest HTTP version for
1029   which the application is at least conditionally compliant.
1030</t>
1031<t>
1032   Proxy and gateway applications need to be careful when forwarding
1033   messages in protocol versions different from that of the application.
1034   Since the protocol version indicates the protocol capability of the
1035   sender, a proxy/gateway &MUST-NOT; send a message with a version
1036   indicator which is greater than its actual version. If a higher
1037   version request is received, the proxy/gateway &MUST; either downgrade
1038   the request version, or respond with an error, or switch to tunnel
1039   behavior.
1040</t>
1041<t>
1042   Due to interoperability problems with HTTP/1.0 proxies discovered
1043   since the publication of <xref target="RFC2068"/>, caching proxies &MUST;, gateways
1044   &MAY;, and tunnels &MUST-NOT; upgrade the request to the highest version
1045   they support. The proxy/gateway's response to that request &MUST; be in
1046   the same major version as the request.
1047</t>
1048<t>
1049  <list>
1050    <t>
1051      <x:h>Note:</x:h> Converting between versions of HTTP may involve modification
1052      of header fields required or forbidden by the versions involved.
1053    </t>
1054  </list>
1055</t>
1056</section>
1057
1058<section title="Uniform Resource Identifiers" anchor="uri">
1059<t>
1060   URIs have been known by many names: WWW addresses, Universal Document
1061   Identifiers, Universal Resource Identifiers <xref target="RFC1630"/>, and finally the
1062   combination of Uniform Resource Locators (URL) <xref target="RFC1738"/> and Names (URN)
1063   <xref target="RFC1737"/>. As far as HTTP is concerned, Uniform Resource Identifiers are
1064   simply formatted strings which identify--via name, location, or any
1065   other characteristic--a resource.
1066</t>
1067
1068<section title="General Syntax" anchor="general.syntax">
1069  <x:anchor-alias value="absoluteURI"/>
1070  <x:anchor-alias value="authority"/>
1071  <x:anchor-alias value="fragment"/>
1072  <x:anchor-alias value="path-absolute"/>
1073  <x:anchor-alias value="port"/>
1074  <x:anchor-alias value="query"/>
1075  <x:anchor-alias value="relativeURI"/>
1076  <x:anchor-alias value="uri-host"/>
1077<t>
1078   URIs in HTTP can be represented in absolute form or relative to some
1079   known base URI <xref target="RFC1808"/>, depending upon the context of their use. The two
1080   forms are differentiated by the fact that absolute URIs always begin
1081   with a scheme name followed by a colon. For definitive information on
1082   URL syntax and semantics, see "Uniform Resource Identifiers (URI):
1083   Generic Syntax and Semantics," <xref target="RFC2396"/> (which replaces <xref target="RFC1738"/>
1084   and <xref target="RFC1808"/>). This specification adopts the
1085   definitions of "URI-reference", "absoluteURI", "fragment", "relativeURI", "port",
1086   "host", "abs_path", "query", and "authority" from that specification:
1087</t>
1088<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="absoluteURI"/><iref primary="true" item="Grammar" subitem="authority"/><iref primary="true" item="Grammar" subitem="path-absolute"/><iref primary="true" item="Grammar" subitem="port"/><iref primary="true" item="Grammar" subitem="query"/><iref primary="true" item="Grammar" subitem="relativeURI"/><iref primary="true" item="Grammar" subitem="uri-host"/>
1089  <x:ref>absoluteURI</x:ref>   = &lt;absoluteURI, defined in <xref target="RFC2396" x:fmt="," x:sec="3"/>>
1090  <x:ref>authority</x:ref>     = &lt;authority, defined in <xref target="RFC2396" x:fmt="," x:sec="3.2"/>>
1091  <x:ref>fragment</x:ref>      = &lt;fragment, defined in <xref target="RFC2396" x:fmt="," x:sec="4.1"/>>
1092  <x:ref>path-absolute</x:ref> = &lt;abs_path, defined in <xref target="RFC2396" x:fmt="," x:sec="3"/>>
1093  <x:ref>port</x:ref>          = &lt;port, defined in <xref target="RFC2396" x:fmt="," x:sec="3.2.2"/>>
1094  <x:ref>query</x:ref>         = &lt;query, defined in <xref target="RFC2396" x:fmt="," x:sec="3.4"/>>
1095  <x:ref>relativeURI</x:ref>   = &lt;relativeURI, defined in <xref target="RFC2396" x:fmt="," x:sec="5"/>>
1096  <x:ref>uri-host</x:ref>      = &lt;host, defined in <xref target="RFC2396" x:fmt="," x:sec="3.2.2"/>>
1097</artwork></figure>
1098<t>
1099   HTTP does not place any a priori limit on the length of
1100   a URI. Servers &MUST; be able to handle the URI of any resource they
1101   serve, and &SHOULD; be able to handle URIs of unbounded length if they
1102   provide GET-based forms that could generate such URIs. A server
1103   &SHOULD; return 414 (Request-URI Too Long) status if a URI is longer
1104   than the server can handle (see &status-414;).
1105</t>
1106<t>
1107  <list>
1108    <t>
1109      <x:h>Note:</x:h> Servers ought to be cautious about depending on URI lengths
1110      above 255 bytes, because some older client or proxy
1111      implementations might not properly support these lengths.
1112    </t>
1113  </list>
1114</t>
1115</section>
1116
1117<section title="http URL" anchor="http.url">
1118  <x:anchor-alias value="http-URL"/>
1119<t>
1120   The "http" scheme is used to locate network resources via the HTTP
1121   protocol. This section defines the scheme-specific syntax and
1122   semantics for http URLs.
1123</t>
1124<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="http-URL"/>
1125  <x:ref>http-URL</x:ref> = "http:" "//" <x:ref>uri-host</x:ref> [ ":" <x:ref>port</x:ref> ]
1126             [ <x:ref>path-absolute</x:ref> [ "?" <x:ref>query</x:ref> ]]
1127</artwork></figure>
1128<t>
1129   If the port is empty or not given, port 80 is assumed. The semantics
1130   are that the identified resource is located at the server listening
1131   for TCP connections on that port of that host, and the Request-URI
1132   for the resource is path-absolute (<xref target="request-uri"/>). The use of IP addresses
1133   in URLs &SHOULD; be avoided whenever possible (see <xref target="RFC1900"/>). If
1134   the path-absolute is not present in the URL, it &MUST; be given as "/" when
1135   used as a Request-URI for a resource (<xref target="request-uri"/>). If a proxy
1136   receives a host name which is not a fully qualified domain name, it
1137   &MAY; add its domain to the host name it received. If a proxy receives
1138   a fully qualified domain name, the proxy &MUST-NOT; change the host
1139   name.
1140</t>
1141</section>
1142
1143<section title="URI Comparison" anchor="uri.comparison">
1144<t>
1145   When comparing two URIs to decide if they match or not, a client
1146   &SHOULD; use a case-sensitive octet-by-octet comparison of the entire
1147   URIs, with these exceptions:
1148  <list style="symbols">
1149    <t>A port that is empty or not given is equivalent to the default
1150        port for that URI-reference;</t>
1151    <t>Comparisons of host names &MUST; be case-insensitive;</t>
1152    <t>Comparisons of scheme names &MUST; be case-insensitive;</t>
1153    <t>An empty path-absolute is equivalent to an path-absolute of "/".</t>
1154  </list>
1155</t>
1156<t>
1157   Characters other than those in the "reserved" set (see
1158   <xref target="RFC2396"/>) are equivalent to their ""%" HEX HEX" encoding.
1159</t>
1160<t>
1161   For example, the following three URIs are equivalent:
1162</t>
1163<figure><artwork type="example">
1164   http://example.com:80/~smith/home.html
1165   http://EXAMPLE.com/%7Esmith/home.html
1166   http://EXAMPLE.com:/%7esmith/home.html
1167</artwork></figure>
1168</section>
1169</section>
1170
1171<section title="Date/Time Formats" anchor="date.time.formats">
1172<section title="Full Date" anchor="full.date">
1173  <x:anchor-alias value="HTTP-date"/>
1174  <x:anchor-alias value="obsolete-date"/>
1175  <x:anchor-alias value="rfc1123-date"/>
1176  <x:anchor-alias value="rfc850-date"/>
1177  <x:anchor-alias value="asctime-date"/>
1178  <x:anchor-alias value="date1"/>
1179  <x:anchor-alias value="date2"/>
1180  <x:anchor-alias value="date3"/>
1181  <x:anchor-alias value="rfc1123-date"/>
1182  <x:anchor-alias value="time"/>
1183  <x:anchor-alias value="wkday"/>
1184  <x:anchor-alias value="weekday"/>
1185  <x:anchor-alias value="month"/>
1186<t>
1187   HTTP applications have historically allowed three different formats
1188   for the representation of date/time stamps:
1189</t>
1190<figure><artwork type="example">
1191   Sun, 06 Nov 1994 08:49:37 GMT  ; RFC 822, updated by RFC 1123
1192   Sunday, 06-Nov-94 08:49:37 GMT ; obsolete RFC 850 format
1193   Sun Nov  6 08:49:37 1994       ; ANSI C's asctime() format
1194</artwork></figure>
1195<t>
1196   The first format is preferred as an Internet standard and represents
1197   a fixed-length subset of that defined by <xref target="RFC1123"/> (an update to
1198   <xref target="RFC822"/>). The other formats are described here only for
1199   compatibility with obsolete implementations.
1200   HTTP/1.1 clients and servers that parse the date value &MUST; accept
1201   all three formats (for compatibility with HTTP/1.0), though they &MUST;
1202   only generate the RFC 1123 format for representing HTTP-date values
1203   in header fields. See <xref target="tolerant.applications"/> for further information.
1204</t>
1205<t><list><t>
1206      <x:h>Note:</x:h> Recipients of date values are encouraged to be robust in
1207      accepting date values that may have been sent by non-HTTP
1208      applications, as is sometimes the case when retrieving or posting
1209      messages via proxies/gateways to SMTP or NNTP.
1210</t></list></t>
1211<t>
1212   All HTTP date/time stamps &MUST; be represented in Greenwich Mean Time
1213   (GMT), without exception. For the purposes of HTTP, GMT is exactly
1214   equal to UTC (Coordinated Universal Time). This is indicated in the
1215   first two formats by the inclusion of "GMT" as the three-letter
1216   abbreviation for time zone, and &MUST; be assumed when reading the
1217   asctime format. HTTP-date is case sensitive and &MUST-NOT; include
1218   additional LWS beyond that specifically included as SP in the
1219   grammar.
1220</t>
1221<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="HTTP-date"/><iref primary="true" item="Grammar" subitem="rfc1123-date"/><iref primary="true" item="Grammar" subitem="obsolete-date"/><iref primary="true" item="Grammar" subitem="rfc850-date"/><iref primary="true" item="Grammar" subitem="asctime-date"/><iref primary="true" item="Grammar" subitem="date1"/><iref primary="true" item="Grammar" subitem="date2"/><iref primary="true" item="Grammar" subitem="date3"/><iref primary="true" item="Grammar" subitem="time"/><iref primary="true" item="Grammar" subitem="wkday"/><iref primary="true" item="Grammar" subitem="weekday"/><iref primary="true" item="Grammar" subitem="month"/>
1222  <x:ref>HTTP-date</x:ref>    = <x:ref>rfc1123-date</x:ref> | <x:ref>obsolete-date</x:ref>
1223  <x:ref>obsolete-date</x:ref> = <x:ref>rfc850-date</x:ref> | <x:ref>asctime-date</x:ref> 
1224  <x:ref>rfc1123-date</x:ref> = <x:ref>wkday</x:ref> "," <x:ref>SP</x:ref> date1 <x:ref>SP</x:ref> time <x:ref>SP</x:ref> GMT
1225  <x:ref>rfc850-date</x:ref>  = <x:ref>weekday</x:ref> "," <x:ref>SP</x:ref> date2 <x:ref>SP</x:ref> time <x:ref>SP</x:ref> GMT
1226  <x:ref>asctime-date</x:ref> = <x:ref>wkday</x:ref> <x:ref>SP</x:ref> <x:ref>date3</x:ref> <x:ref>SP</x:ref> <x:ref>time</x:ref> <x:ref>SP</x:ref> 4<x:ref>DIGIT</x:ref>
1227  <x:ref>date1</x:ref>        = 2<x:ref>DIGIT</x:ref> <x:ref>SP</x:ref> <x:ref>month</x:ref> <x:ref>SP</x:ref> 4<x:ref>DIGIT</x:ref>
1228                 ; day month year (e.g., 02 Jun 1982)
1229  <x:ref>date2</x:ref>        = 2<x:ref>DIGIT</x:ref> "-" <x:ref>month</x:ref> "-" 2<x:ref>DIGIT</x:ref>
1230                 ; day-month-year (e.g., 02-Jun-82)
1231  <x:ref>date3</x:ref>        = <x:ref>month</x:ref> <x:ref>SP</x:ref> ( 2<x:ref>DIGIT</x:ref> | ( <x:ref>SP</x:ref> 1<x:ref>DIGIT</x:ref> ))
1232                 ; month day (e.g., Jun  2)
1233  <x:ref>time</x:ref>         = 2<x:ref>DIGIT</x:ref> ":" 2<x:ref>DIGIT</x:ref> ":" 2<x:ref>DIGIT</x:ref>
1234                 ; 00:00:00 - 23:59:59
1235  <x:ref>wkday</x:ref>        = s-Mon | s-Tue | s-Wed
1236               | s-Thu | s-Fri | s-Sat | s-Sun
1237  <x:ref>weekday</x:ref>      = l-Mon | l-Tue | l-Wed
1238               | l-Thu | l-Fri | l-Sat | l-Sun
1239  <x:ref>month</x:ref>        = s-Jan | s-Feb | s-Mar | s-Apr
1240               | s-May | s-Jun | s-Jul | s-Aug
1241               | s-Sep | s-Oct | s-Nov | s-Dec
1242               
1243  GMT   = <x:abnf-char-sequence>"GMT"</x:abnf-char-sequence> ; "GMT", case-sensitive
1244
1245  s-Mon = <x:abnf-char-sequence>"Mon"</x:abnf-char-sequence> ; "Mon", case-sensitive
1246  s-Tue = <x:abnf-char-sequence>"Tue"</x:abnf-char-sequence> ; "Tue", case-sensitive
1247  s-Wed = <x:abnf-char-sequence>"Wed"</x:abnf-char-sequence> ; "Wed", case-sensitive
1248  s-Thu = <x:abnf-char-sequence>"Thu"</x:abnf-char-sequence> ; "Thu", case-sensitive
1249  s-Fri = <x:abnf-char-sequence>"Fri"</x:abnf-char-sequence> ; "Fri", case-sensitive
1250  s-Sat = <x:abnf-char-sequence>"Sat"</x:abnf-char-sequence> ; "Sat", case-sensitive
1251  s-Sun = <x:abnf-char-sequence>"Sun"</x:abnf-char-sequence> ; "Sun", case-sensitive
1252
1253  l-Mon = <x:abnf-char-sequence>"Monday"</x:abnf-char-sequence>          ; "Monday", case-sensitive
1254  l-Tue = <x:abnf-char-sequence>"Tuesday"</x:abnf-char-sequence>       ; "Tuesday", case-sensitive
1255  l-Wed = <x:abnf-char-sequence>"Wednesday"</x:abnf-char-sequence> ; "Wednesday", case-sensitive
1256  l-Thu = <x:abnf-char-sequence>"Thursday"</x:abnf-char-sequence>    ; "Thursday", case-sensitive
1257  l-Fri = <x:abnf-char-sequence>"Friday"</x:abnf-char-sequence>          ; "Friday", case-sensitive
1258  l-Sat = <x:abnf-char-sequence>"Saturday"</x:abnf-char-sequence>    ; "Saturday", case-sensitive
1259  l-Sun = <x:abnf-char-sequence>"Sunday"</x:abnf-char-sequence>          ; "Sunday", case-sensitive
1260
1261  s-Jan = <x:abnf-char-sequence>"Jan"</x:abnf-char-sequence> ; "Jan", case-sensitive
1262  s-Feb = <x:abnf-char-sequence>"Feb"</x:abnf-char-sequence> ; "Feb", case-sensitive
1263  s-Mar = <x:abnf-char-sequence>"Mar"</x:abnf-char-sequence> ; "Mar", case-sensitive
1264  s-Apr = <x:abnf-char-sequence>"Apr"</x:abnf-char-sequence> ; "Apr", case-sensitive
1265  s-May = <x:abnf-char-sequence>"May"</x:abnf-char-sequence> ; "May", case-sensitive
1266  s-Jun = <x:abnf-char-sequence>"Jun"</x:abnf-char-sequence> ; "Jun", case-sensitive
1267  s-Jul = <x:abnf-char-sequence>"Jul"</x:abnf-char-sequence> ; "Jul", case-sensitive
1268  s-Aug = <x:abnf-char-sequence>"Aug"</x:abnf-char-sequence> ; "Aug", case-sensitive
1269  s-Sep = <x:abnf-char-sequence>"Sep"</x:abnf-char-sequence> ; "Sep", case-sensitive
1270  s-Oct = <x:abnf-char-sequence>"Oct"</x:abnf-char-sequence> ; "Oct", case-sensitive
1271  s-Nov = <x:abnf-char-sequence>"Nov"</x:abnf-char-sequence> ; "Nov", case-sensitive
1272  s-Dec = <x:abnf-char-sequence>"Dec"</x:abnf-char-sequence> ; "Dec", case-sensitive
1273</artwork></figure>
1274<t>
1275      <x:h>Note:</x:h> HTTP requirements for the date/time stamp format apply only
1276      to their usage within the protocol stream. Clients and servers are
1277      not required to use these formats for user presentation, request
1278      logging, etc.
1279</t>
1280</section>
1281</section>
1282
1283<section title="Transfer Codings" anchor="transfer.codings">
1284  <x:anchor-alias value="parameter"/>
1285  <x:anchor-alias value="transfer-coding"/>
1286  <x:anchor-alias value="transfer-extension"/>
1287<t>
1288   Transfer-coding values are used to indicate an encoding
1289   transformation that has been, can be, or may need to be applied to an
1290   entity-body in order to ensure "safe transport" through the network.
1291   This differs from a content coding in that the transfer-coding is a
1292   property of the message, not of the original entity.
1293</t>
1294<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="transfer-coding"/><iref primary="true" item="Grammar" subitem="transfer-extension"/>
1295  <x:ref>transfer-coding</x:ref>         = "chunked" | <x:ref>transfer-extension</x:ref>
1296  <x:ref>transfer-extension</x:ref>      = <x:ref>token</x:ref> *( ";" <x:ref>parameter</x:ref> )
1297</artwork></figure>
1298<t anchor="rule.parameter">
1299  <x:anchor-alias value="attribute"/>
1300  <x:anchor-alias value="parameter"/>
1301  <x:anchor-alias value="value"/>
1302   Parameters are in  the form of attribute/value pairs.
1303</t>
1304<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="parameter"/><iref primary="true" item="Grammar" subitem="attribute"/><iref primary="true" item="Grammar" subitem="value"/>
1305  <x:ref>parameter</x:ref>               = <x:ref>attribute</x:ref> "=" <x:ref>value</x:ref>
1306  <x:ref>attribute</x:ref>               = <x:ref>token</x:ref>
1307  <x:ref>value</x:ref>                   = <x:ref>token</x:ref> | <x:ref>quoted-string</x:ref>
1308</artwork></figure>
1309<t>
1310   All transfer-coding values are case-insensitive. HTTP/1.1 uses
1311   transfer-coding values in the TE header field (<xref target="header.te"/>) and in
1312   the Transfer-Encoding header field (<xref target="header.transfer-encoding"/>).
1313</t>
1314<t>
1315   Whenever a transfer-coding is applied to a message-body, the set of
1316   transfer-codings &MUST; include "chunked", unless the message is
1317   terminated by closing the connection. When the "chunked" transfer-coding
1318   is used, it &MUST; be the last transfer-coding applied to the
1319   message-body. The "chunked" transfer-coding &MUST-NOT; be applied more
1320   than once to a message-body. These rules allow the recipient to
1321   determine the transfer-length of the message (<xref target="message.length"/>).
1322</t>
1323<t>
1324   Transfer-codings are analogous to the Content-Transfer-Encoding
1325   values of MIME <xref target="RFC2045"/>, which were designed to enable safe transport of
1326   binary data over a 7-bit transport service. However, safe transport
1327   has a different focus for an 8bit-clean transfer protocol. In HTTP,
1328   the only unsafe characteristic of message-bodies is the difficulty in
1329   determining the exact body length (<xref target="message.length"/>), or the desire to
1330   encrypt data over a shared transport.
1331</t>
1332<t>
1333   The Internet Assigned Numbers Authority (IANA) acts as a registry for
1334   transfer-coding value tokens. Initially, the registry contains the
1335   following tokens: "chunked" (<xref target="chunked.transfer.encoding"/>),
1336   "gzip", "compress", and "deflate" (&content-codings;).
1337</t>
1338<t>
1339   New transfer-coding value tokens &SHOULD; be registered in the same way
1340   as new content-coding value tokens (&content-codings;).
1341</t>
1342<t>
1343   A server which receives an entity-body with a transfer-coding it does
1344   not understand &SHOULD; return 501 (Not Implemented), and close the
1345   connection. A server &MUST-NOT; send transfer-codings to an HTTP/1.0
1346   client.
1347</t>
1348
1349<section title="Chunked Transfer Coding" anchor="chunked.transfer.encoding">
1350  <x:anchor-alias value="chunk"/>
1351  <x:anchor-alias value="Chunked-Body"/>
1352  <x:anchor-alias value="chunk-data"/>
1353  <x:anchor-alias value="chunk-extension"/>
1354  <x:anchor-alias value="chunk-ext-name"/>
1355  <x:anchor-alias value="chunk-ext-val"/>
1356  <x:anchor-alias value="chunk-size"/>
1357  <x:anchor-alias value="last-chunk"/>
1358  <x:anchor-alias value="trailer-part"/>
1359<t>
1360   The chunked encoding modifies the body of a message in order to
1361   transfer it as a series of chunks, each with its own size indicator,
1362   followed by an &OPTIONAL; trailer containing entity-header fields. This
1363   allows dynamically produced content to be transferred along with the
1364   information necessary for the recipient to verify that it has
1365   received the full message.
1366</t>
1367<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Chunked-Body"/><iref primary="true" item="Grammar" subitem="chunk"/><iref primary="true" item="Grammar" subitem="chunk-size"/><iref primary="true" item="Grammar" subitem="last-chunk"/><iref primary="true" item="Grammar" subitem="chunk-extension"/><iref primary="true" item="Grammar" subitem="chunk-ext-name"/><iref primary="true" item="Grammar" subitem="chunk-ext-val"/><iref primary="true" item="Grammar" subitem="chunk-data"/><iref primary="true" item="Grammar" subitem="trailer-part"/>
1368  <x:ref>Chunked-Body</x:ref>   = *<x:ref>chunk</x:ref>
1369                   <x:ref>last-chunk</x:ref>
1370                   <x:ref>trailer-part</x:ref>
1371                   <x:ref>CRLF</x:ref>
1372 
1373  <x:ref>chunk</x:ref>          = <x:ref>chunk-size</x:ref> [ <x:ref>chunk-extension</x:ref> ] <x:ref>CRLF</x:ref>
1374                   <x:ref>chunk-data</x:ref> <x:ref>CRLF</x:ref>
1375  <x:ref>chunk-size</x:ref>     = 1*<x:ref>HEX</x:ref>
1376  <x:ref>last-chunk</x:ref>     = 1*("0") [ <x:ref>chunk-extension</x:ref> ] <x:ref>CRLF</x:ref>
1377 
1378  <x:ref>chunk-extension</x:ref>= *( ";" <x:ref>chunk-ext-name</x:ref> [ "=" <x:ref>chunk-ext-val</x:ref> ] )
1379  <x:ref>chunk-ext-name</x:ref> = <x:ref>token</x:ref>
1380  <x:ref>chunk-ext-val</x:ref>  = <x:ref>token</x:ref> | <x:ref>quoted-string</x:ref>
1381  <x:ref>chunk-data</x:ref>     = 1*<x:ref>OCTET</x:ref> ; a sequence of chunk-size octets
1382  <x:ref>trailer-part</x:ref>   = *(<x:ref>entity-header</x:ref> <x:ref>CRLF</x:ref>)
1383</artwork></figure>
1384<t>
1385   The chunk-size field is a string of hex digits indicating the size of
1386   the chunk-data in octets. The chunked encoding is ended by any chunk whose size is
1387   zero, followed by the trailer, which is terminated by an empty line.
1388</t>
1389<t>
1390   The trailer allows the sender to include additional HTTP header
1391   fields at the end of the message. The Trailer header field can be
1392   used to indicate which header fields are included in a trailer (see
1393   <xref target="header.trailer"/>).
1394</t>
1395<t>
1396   A server using chunked transfer-coding in a response &MUST-NOT; use the
1397   trailer for any header fields unless at least one of the following is
1398   true:
1399  <list style="numbers">
1400    <t>the request included a TE header field that indicates "trailers" is
1401     acceptable in the transfer-coding of the  response, as described in
1402     <xref target="header.te"/>; or,</t>
1403
1404    <t>the server is the origin server for the response, the trailer
1405     fields consist entirely of optional metadata, and the recipient
1406     could use the message (in a manner acceptable to the origin server)
1407     without receiving this metadata.  In other words, the origin server
1408     is willing to accept the possibility that the trailer fields might
1409     be silently discarded along the path to the client.</t>
1410  </list>
1411</t>
1412<t>
1413   This requirement prevents an interoperability failure when the
1414   message is being received by an HTTP/1.1 (or later) proxy and
1415   forwarded to an HTTP/1.0 recipient. It avoids a situation where
1416   compliance with the protocol would have necessitated a possibly
1417   infinite buffer on the proxy.
1418</t>
1419<t>
1420   A process for decoding the "chunked" transfer-coding
1421   can be represented in pseudo-code as:
1422</t>
1423<figure><artwork type="code">
1424    length := 0
1425    read chunk-size, chunk-extension (if any) and CRLF
1426    while (chunk-size &gt; 0) {
1427       read chunk-data and CRLF
1428       append chunk-data to entity-body
1429       length := length + chunk-size
1430       read chunk-size and CRLF
1431    }
1432    read entity-header
1433    while (entity-header not empty) {
1434       append entity-header to existing header fields
1435       read entity-header
1436    }
1437    Content-Length := length
1438    Remove "chunked" from Transfer-Encoding
1439</artwork></figure>
1440<t>
1441   All HTTP/1.1 applications &MUST; be able to receive and decode the
1442   "chunked" transfer-coding, and &MUST; ignore chunk-extension extensions
1443   they do not understand.
1444</t>
1445</section>
1446</section>
1447
1448<section title="Product Tokens" anchor="product.tokens">
1449  <x:anchor-alias value="product"/>
1450  <x:anchor-alias value="product-version"/>
1451<t>
1452   Product tokens are used to allow communicating applications to
1453   identify themselves by software name and version. Most fields using
1454   product tokens also allow sub-products which form a significant part
1455   of the application to be listed, separated by white space. By
1456   convention, the products are listed in order of their significance
1457   for identifying the application.
1458</t>
1459<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="product"/><iref primary="true" item="Grammar" subitem="product-version"/>
1460  <x:ref>product</x:ref>         = <x:ref>token</x:ref> ["/" <x:ref>product-version</x:ref>]
1461  <x:ref>product-version</x:ref> = <x:ref>token</x:ref>
1462</artwork></figure>
1463<t>
1464   Examples:
1465</t>
1466<figure><artwork type="example">
1467    User-Agent: CERN-LineMode/2.15 libwww/2.17b3
1468    Server: Apache/0.8.4
1469</artwork></figure>
1470<t>
1471   Product tokens &SHOULD; be short and to the point. They &MUST-NOT; be
1472   used for advertising or other non-essential information. Although any
1473   token character &MAY; appear in a product-version, this token &SHOULD;
1474   only be used for a version identifier (i.e., successive versions of
1475   the same product &SHOULD; only differ in the product-version portion of
1476   the product value).
1477</t>
1478</section>
1479
1480</section>
1481
1482<section title="HTTP Message" anchor="http.message">
1483
1484<section title="Message Types" anchor="message.types">
1485  <x:anchor-alias value="generic-message"/>
1486  <x:anchor-alias value="HTTP-message"/>
1487  <x:anchor-alias value="start-line"/>
1488<t>
1489   HTTP messages consist of requests from client to server and responses
1490   from server to client.
1491</t>
1492<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="HTTP-message"/>
1493  <x:ref>HTTP-message</x:ref>   = <x:ref>Request</x:ref> | <x:ref>Response</x:ref>     ; HTTP/1.1 messages
1494</artwork></figure>
1495<t>
1496   Request (<xref target="request"/>) and Response (<xref target="response"/>) messages use the generic
1497   message format of <xref target="RFC2822"/> for transferring entities (the payload
1498   of the message). Both types of message consist of a start-line, zero
1499   or more header fields (also known as "headers"), an empty line (i.e.,
1500   a line with nothing preceding the CRLF) indicating the end of the
1501   header fields, and possibly a message-body.
1502</t>
1503<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="generic-message"/><iref primary="true" item="Grammar" subitem="start-line"/>
1504  <x:ref>generic-message</x:ref> = <x:ref>start-line</x:ref>
1505                    *(<x:ref>message-header</x:ref> <x:ref>CRLF</x:ref>)
1506                    <x:ref>CRLF</x:ref>
1507                    [ <x:ref>message-body</x:ref> ]
1508  <x:ref>start-line</x:ref>      = <x:ref>Request-Line</x:ref> | <x:ref>Status-Line</x:ref>
1509</artwork></figure>
1510<t>
1511   In the interest of robustness, servers &SHOULD; ignore any empty
1512   line(s) received where a Request-Line is expected. In other words, if
1513   the server is reading the protocol stream at the beginning of a
1514   message and receives a CRLF first, it should ignore the CRLF.
1515</t>
1516<t>
1517   Certain buggy HTTP/1.0 client implementations generate extra CRLF's
1518   after a POST request. To restate what is explicitly forbidden by the
1519   BNF, an HTTP/1.1 client &MUST-NOT; preface or follow a request with an
1520   extra CRLF.
1521</t>
1522</section>
1523
1524<section title="Message Headers" anchor="message.headers">
1525  <x:anchor-alias value="field-content"/>
1526  <x:anchor-alias value="field-name"/>
1527  <x:anchor-alias value="field-value"/>
1528  <x:anchor-alias value="message-header"/>
1529<t>
1530   HTTP header fields, which include general-header (<xref target="general.header.fields"/>),
1531   request-header (&request-header-fields;), response-header (&response-header-fields;), and
1532   entity-header (&entity-header-fields;) fields, follow the same generic format as
1533   that given in <xref target="RFC2822" x:fmt="of" x:sec="2.1"/>. Each header field consists
1534   of a name followed by a colon (":") and the field value. Field names
1535   are case-insensitive. The field value &MAY; be preceded by any amount
1536   of LWS, though a single SP is preferred. Header fields can be
1537   extended over multiple lines by preceding each extra line with at
1538   least one SP or HTAB. Applications ought to follow "common form", where
1539   one is known or indicated, when generating HTTP constructs, since
1540   there might exist some implementations that fail to accept anything
1541   beyond the common forms.
1542</t>
1543<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="message-header"/><iref primary="true" item="Grammar" subitem="field-name"/><iref primary="true" item="Grammar" subitem="field-value"/><iref primary="true" item="Grammar" subitem="field-content"/>
1544  <x:ref>message-header</x:ref> = <x:ref>field-name</x:ref> ":" [ <x:ref>field-value</x:ref> ]
1545  <x:ref>field-name</x:ref>     = <x:ref>token</x:ref>
1546  <x:ref>field-value</x:ref>    = *( <x:ref>field-content</x:ref> | <x:ref>LWS</x:ref> )
1547  <x:ref>field-content</x:ref>  = &lt;field content&gt;
1548                   ; the <x:ref>OCTET</x:ref>s making up the field-value
1549                   ; and consisting of either *<x:ref>TEXT</x:ref> or combinations
1550                   ; of <x:ref>token</x:ref>, <x:ref>separators</x:ref>, and <x:ref>quoted-string</x:ref>
1551</artwork></figure>
1552<t>
1553   The field-content does not include any leading or trailing LWS:
1554   linear white space occurring before the first non-whitespace
1555   character of the field-value or after the last non-whitespace
1556   character of the field-value. Such leading or trailing LWS &MAY; be
1557   removed without changing the semantics of the field value. Any LWS
1558   that occurs between field-content &MAY; be replaced with a single SP
1559   before interpreting the field value or forwarding the message
1560   downstream.
1561</t>
1562<t>
1563   The order in which header fields with differing field names are
1564   received is not significant. However, it is "good practice" to send
1565   general-header fields first, followed by request-header or response-header
1566   fields, and ending with the entity-header fields.
1567</t>
1568<t>
1569   Multiple message-header fields with the same field-name &MAY; be
1570   present in a message if and only if the entire field-value for that
1571   header field is defined as a comma-separated list [i.e., #(values)].
1572   It &MUST; be possible to combine the multiple header fields into one
1573   "field-name: field-value" pair, without changing the semantics of the
1574   message, by appending each subsequent field-value to the first, each
1575   separated by a comma. The order in which header fields with the same
1576   field-name are received is therefore significant to the
1577   interpretation of the combined field value, and thus a proxy &MUST-NOT;
1578   change the order of these field values when a message is forwarded.
1579</t>
1580</section>
1581
1582<section title="Message Body" anchor="message.body">
1583  <x:anchor-alias value="message-body"/>
1584<t>
1585   The message-body (if any) of an HTTP message is used to carry the
1586   entity-body associated with the request or response. The message-body
1587   differs from the entity-body only when a transfer-coding has been
1588   applied, as indicated by the Transfer-Encoding header field (<xref target="header.transfer-encoding"/>).
1589</t>
1590<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="message-body"/>
1591  <x:ref>message-body</x:ref> = <x:ref>entity-body</x:ref>
1592               | &lt;entity-body encoded as per <x:ref>Transfer-Encoding</x:ref>&gt;
1593</artwork></figure>
1594<t>
1595   Transfer-Encoding &MUST; be used to indicate any transfer-codings
1596   applied by an application to ensure safe and proper transfer of the
1597   message. Transfer-Encoding is a property of the message, not of the
1598   entity, and thus &MAY; be added or removed by any application along the
1599   request/response chain. (However, <xref target="transfer.codings"/> places restrictions on
1600   when certain transfer-codings may be used.)
1601</t>
1602<t>
1603   The rules for when a message-body is allowed in a message differ for
1604   requests and responses.
1605</t>
1606<t>
1607   The presence of a message-body in a request is signaled by the
1608   inclusion of a Content-Length or Transfer-Encoding header field in
1609   the request's message-headers. A message-body &MUST-NOT; be included in
1610   a request if the specification of the request method (&method;)
1611   explicitly disallows an entity-body in requests.
1612   When a request message contains both a message-body of non-zero
1613   length and a method that does not define any semantics for that
1614   request message-body, then an origin server &SHOULD; either ignore
1615   the message-body or respond with an appropriate error message
1616   (e.g., 413).  A proxy or gateway, when presented the same request,
1617   &SHOULD; either forward the request inbound with the message-body or
1618   ignore the message-body when determining a response.
1619</t>
1620<t>
1621   For response messages, whether or not a message-body is included with
1622   a message is dependent on both the request method and the response
1623   status code (<xref target="status.code.and.reason.phrase"/>). All responses to the HEAD request method
1624   &MUST-NOT; include a message-body, even though the presence of entity-header
1625   fields might lead one to believe they do. All 1xx
1626   (informational), 204 (No Content), and 304 (Not Modified) responses
1627   &MUST-NOT; include a message-body. All other responses do include a
1628   message-body, although it &MAY; be of zero length.
1629</t>
1630</section>
1631
1632<section title="Message Length" anchor="message.length">
1633<t>
1634   The transfer-length of a message is the length of the message-body as
1635   it appears in the message; that is, after any transfer-codings have
1636   been applied. When a message-body is included with a message, the
1637   transfer-length of that body is determined by one of the following
1638   (in order of precedence):
1639</t>
1640<t>
1641  <list style="numbers">
1642    <x:lt><t>
1643     Any response message which "&MUST-NOT;" include a message-body (such
1644     as the 1xx, 204, and 304 responses and any response to a HEAD
1645     request) is always terminated by the first empty line after the
1646     header fields, regardless of the entity-header fields present in
1647     the message.
1648    </t></x:lt>
1649    <x:lt><t>
1650     If a Transfer-Encoding header field (<xref target="header.transfer-encoding"/>)
1651     is present, then the transfer-length is
1652     defined by use of the "chunked" transfer-coding (<xref target="transfer.codings"/>),
1653     unless the message is terminated by closing the connection.
1654    </t></x:lt>
1655    <x:lt><t>
1656     If a Content-Length header field (<xref target="header.content-length"/>) is present, its
1657     decimal value in OCTETs represents both the entity-length and the
1658     transfer-length. The Content-Length header field &MUST-NOT; be sent
1659     if these two lengths are different (i.e., if a Transfer-Encoding
1660     header field is present). If a message is received with both a
1661     Transfer-Encoding header field and a Content-Length header field,
1662     the latter &MUST; be ignored.
1663    </t></x:lt>
1664    <x:lt><t>
1665     If the message uses the media type "multipart/byteranges", and the
1666     transfer-length is not otherwise specified, then this self-delimiting
1667     media type defines the transfer-length. This media type
1668     &MUST-NOT; be used unless the sender knows that the recipient can parse
1669     it; the presence in a request of a Range header with multiple byte-range
1670     specifiers from a 1.1 client implies that the client can parse
1671     multipart/byteranges responses.
1672    <list style="empty"><t>
1673       A range header might be forwarded by a 1.0 proxy that does not
1674       understand multipart/byteranges; in this case the server &MUST;
1675       delimit the message using methods defined in items 1, 3 or 5 of
1676       this section.
1677    </t></list>
1678    </t></x:lt>
1679    <x:lt><t>
1680     By the server closing the connection. (Closing the connection
1681     cannot be used to indicate the end of a request body, since that
1682     would leave no possibility for the server to send back a response.)
1683    </t></x:lt>
1684  </list>
1685</t>
1686<t>
1687   For compatibility with HTTP/1.0 applications, HTTP/1.1 requests
1688   containing a message-body &MUST; include a valid Content-Length header
1689   field unless the server is known to be HTTP/1.1 compliant. If a
1690   request contains a message-body and a Content-Length is not given,
1691   the server &SHOULD; respond with 400 (Bad Request) if it cannot
1692   determine the length of the message, or with 411 (Length Required) if
1693   it wishes to insist on receiving a valid Content-Length.
1694</t>
1695<t>
1696   All HTTP/1.1 applications that receive entities &MUST; accept the
1697   "chunked" transfer-coding (<xref target="transfer.codings"/>), thus allowing this mechanism
1698   to be used for messages when the message length cannot be determined
1699   in advance.
1700</t>
1701<t>
1702   Messages &MUST-NOT; include both a Content-Length header field and a
1703   transfer-coding. If the message does include a
1704   transfer-coding, the Content-Length &MUST; be ignored.
1705</t>
1706<t>
1707   When a Content-Length is given in a message where a message-body is
1708   allowed, its field value &MUST; exactly match the number of OCTETs in
1709   the message-body. HTTP/1.1 user agents &MUST; notify the user when an
1710   invalid length is received and detected.
1711</t>
1712</section>
1713
1714<section title="General Header Fields" anchor="general.header.fields">
1715  <x:anchor-alias value="general-header"/>
1716<t>
1717   There are a few header fields which have general applicability for
1718   both request and response messages, but which do not apply to the
1719   entity being transferred. These header fields apply only to the
1720   message being transmitted.
1721</t>
1722<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="general-header"/>
1723  <x:ref>general-header</x:ref> = <x:ref>Cache-Control</x:ref>            ; &header-cache-control;
1724                 | <x:ref>Connection</x:ref>               ; <xref target="header.connection"/>
1725                 | <x:ref>Date</x:ref>                     ; <xref target="header.date"/>
1726                 | <x:ref>Pragma</x:ref>                   ; &header-pragma;
1727                 | <x:ref>Trailer</x:ref>                  ; <xref target="header.trailer"/>
1728                 | <x:ref>Transfer-Encoding</x:ref>        ; <xref target="header.transfer-encoding"/>
1729                 | <x:ref>Upgrade</x:ref>                  ; <xref target="header.upgrade"/>
1730                 | <x:ref>Via</x:ref>                      ; <xref target="header.via"/>
1731                 | <x:ref>Warning</x:ref>                  ; &header-warning;
1732</artwork></figure>
1733<t>
1734   General-header field names can be extended reliably only in
1735   combination with a change in the protocol version. However, new or
1736   experimental header fields may be given the semantics of general
1737   header fields if all parties in the communication recognize them to
1738   be general-header fields. Unrecognized header fields are treated as
1739   entity-header fields.
1740</t>
1741</section>
1742</section>
1743
1744<section title="Request" anchor="request">
1745  <x:anchor-alias value="Request"/>
1746<t>
1747   A request message from a client to a server includes, within the
1748   first line of that message, the method to be applied to the resource,
1749   the identifier of the resource, and the protocol version in use.
1750</t>
1751<!--                 Host                      ; should be moved here eventually -->
1752<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Request"/>
1753  <x:ref>Request</x:ref>       = <x:ref>Request-Line</x:ref>              ; <xref target="request-line"/>
1754                  *(( <x:ref>general-header</x:ref>        ; <xref target="general.header.fields"/>
1755                   | <x:ref>request-header</x:ref>         ; &request-header-fields;
1756                   | <x:ref>entity-header</x:ref> ) <x:ref>CRLF</x:ref>)  ; &entity-header-fields;
1757                  <x:ref>CRLF</x:ref>
1758                  [ <x:ref>message-body</x:ref> ]          ; <xref target="message.body"/>
1759</artwork></figure>
1760
1761<section title="Request-Line" anchor="request-line">
1762  <x:anchor-alias value="Request-Line"/>
1763<t>
1764   The Request-Line begins with a method token, followed by the
1765   Request-URI and the protocol version, and ending with CRLF. The
1766   elements are separated by SP characters. No CR or LF is allowed
1767   except in the final CRLF sequence.
1768</t>
1769<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Request-Line"/>
1770  <x:ref>Request-Line</x:ref>   = <x:ref>Method</x:ref> <x:ref>SP</x:ref> <x:ref>Request-URI</x:ref> <x:ref>SP</x:ref> <x:ref>HTTP-Version</x:ref> <x:ref>CRLF</x:ref>
1771</artwork></figure>
1772
1773<section title="Method" anchor="method">
1774  <x:anchor-alias value="Method"/>
1775<t>
1776   The Method  token indicates the method to be performed on the
1777   resource identified by the Request-URI. The method is case-sensitive.
1778</t>
1779<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Method"/><iref primary="true" item="Grammar" subitem="extension-method"/>
1780  <x:ref>Method</x:ref>         = <x:ref>token</x:ref>
1781</artwork></figure>
1782</section>
1783
1784<section title="Request-URI" anchor="request-uri">
1785  <x:anchor-alias value="Request-URI"/>
1786<t>
1787   The Request-URI is a Uniform Resource Identifier (<xref target="uri"/>) and
1788   identifies the resource upon which to apply the request.
1789</t>
1790<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Request-URI"/>
1791  <x:ref>Request-URI</x:ref>    = "*"
1792                 | <x:ref>absoluteURI</x:ref>
1793                 | ( <x:ref>path-absolute</x:ref> [ "?" <x:ref>query</x:ref> ] )
1794                 | <x:ref>authority</x:ref>
1795</artwork></figure>
1796<t>
1797   The four options for Request-URI are dependent on the nature of the
1798   request. The asterisk "*" means that the request does not apply to a
1799   particular resource, but to the server itself, and is only allowed
1800   when the method used does not necessarily apply to a resource. One
1801   example would be
1802</t>
1803<figure><artwork type="example">
1804    OPTIONS * HTTP/1.1
1805</artwork></figure>
1806<t>
1807   The absoluteURI form is &REQUIRED; when the request is being made to a
1808   proxy. The proxy is requested to forward the request or service it
1809   from a valid cache, and return the response. Note that the proxy &MAY;
1810   forward the request on to another proxy or directly to the server
1811   specified by the absoluteURI. In order to avoid request loops, a
1812   proxy &MUST; be able to recognize all of its server names, including
1813   any aliases, local variations, and the numeric IP address. An example
1814   Request-Line would be:
1815</t>
1816<figure><artwork type="example">
1817    GET http://www.example.org/pub/WWW/TheProject.html HTTP/1.1
1818</artwork></figure>
1819<t>
1820   To allow for transition to absoluteURIs in all requests in future
1821   versions of HTTP, all HTTP/1.1 servers &MUST; accept the absoluteURI
1822   form in requests, even though HTTP/1.1 clients will only generate
1823   them in requests to proxies.
1824</t>
1825<t>
1826   The authority form is only used by the CONNECT method (&CONNECT;).
1827</t>
1828<t>
1829   The most common form of Request-URI is that used to identify a
1830   resource on an origin server or gateway. In this case the absolute
1831   path of the URI &MUST; be transmitted (see <xref target="general.syntax"/>, path-absolute) as
1832   the Request-URI, and the network location of the URI (authority) &MUST;
1833   be transmitted in a Host header field. For example, a client wishing
1834   to retrieve the resource above directly from the origin server would
1835   create a TCP connection to port 80 of the host "www.example.org" and send
1836   the lines:
1837</t>
1838<figure><artwork type="example">
1839    GET /pub/WWW/TheProject.html HTTP/1.1
1840    Host: www.example.org
1841</artwork></figure>
1842<t>
1843   followed by the remainder of the Request. Note that the absolute path
1844   cannot be empty; if none is present in the original URI, it &MUST; be
1845   given as "/" (the server root).
1846</t>
1847<t>
1848   The Request-URI is transmitted in the format specified in
1849   <xref target="general.syntax"/>. If the Request-URI is encoded using the "% HEX HEX" encoding
1850   <xref target="RFC2396"/>, the origin server &MUST; decode the Request-URI in order to
1851   properly interpret the request. Servers &SHOULD; respond to invalid
1852   Request-URIs with an appropriate status code.
1853</t>
1854<t>
1855   A transparent proxy &MUST-NOT; rewrite the "path-absolute" part of the
1856   received Request-URI when forwarding it to the next inbound server,
1857   except as noted above to replace a null path-absolute with "/".
1858</t>
1859<t>
1860  <list><t>
1861      <x:h>Note:</x:h> The "no rewrite" rule prevents the proxy from changing the
1862      meaning of the request when the origin server is improperly using
1863      a non-reserved URI character for a reserved purpose.  Implementors
1864      should be aware that some pre-HTTP/1.1 proxies have been known to
1865      rewrite the Request-URI.
1866  </t></list>
1867</t>
1868</section>
1869</section>
1870
1871<section title="The Resource Identified by a Request" anchor="the.resource.identified.by.a.request">
1872<t>
1873   The exact resource identified by an Internet request is determined by
1874   examining both the Request-URI and the Host header field.
1875</t>
1876<t>
1877   An origin server that does not allow resources to differ by the
1878   requested host &MAY; ignore the Host header field value when
1879   determining the resource identified by an HTTP/1.1 request. (But see
1880   <xref target="changes.to.simplify.multi-homed.web.servers.and.conserve.ip.addresses"/>
1881   for other requirements on Host support in HTTP/1.1.)
1882</t>
1883<t>
1884   An origin server that does differentiate resources based on the host
1885   requested (sometimes referred to as virtual hosts or vanity host
1886   names) &MUST; use the following rules for determining the requested
1887   resource on an HTTP/1.1 request:
1888  <list style="numbers">
1889    <t>If Request-URI is an absoluteURI, the host is part of the
1890     Request-URI. Any Host header field value in the request &MUST; be
1891     ignored.</t>
1892    <t>If the Request-URI is not an absoluteURI, and the request includes
1893     a Host header field, the host is determined by the Host header
1894     field value.</t>
1895    <t>If the host as determined by rule 1 or 2 is not a valid host on
1896     the server, the response &MUST; be a 400 (Bad Request) error message.</t>
1897  </list>
1898</t>
1899<t>
1900   Recipients of an HTTP/1.0 request that lacks a Host header field &MAY;
1901   attempt to use heuristics (e.g., examination of the URI path for
1902   something unique to a particular host) in order to determine what
1903   exact resource is being requested.
1904</t>
1905</section>
1906
1907</section>
1908
1909
1910<section title="Response" anchor="response">
1911  <x:anchor-alias value="Response"/>
1912<t>
1913   After receiving and interpreting a request message, a server responds
1914   with an HTTP response message.
1915</t>
1916<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Response"/>
1917  <x:ref>Response</x:ref>      = <x:ref>Status-Line</x:ref>               ; <xref target="status-line"/>
1918                  *(( <x:ref>general-header</x:ref>        ; <xref target="general.header.fields"/>
1919                   | <x:ref>response-header</x:ref>        ; &response-header-fields;
1920                   | <x:ref>entity-header</x:ref> ) <x:ref>CRLF</x:ref>)  ; &entity-header-fields;
1921                  <x:ref>CRLF</x:ref>
1922                  [ <x:ref>message-body</x:ref> ]          ; <xref target="message.body"/>
1923</artwork></figure>
1924
1925<section title="Status-Line" anchor="status-line">
1926  <x:anchor-alias value="Status-Line"/>
1927<t>
1928   The first line of a Response message is the Status-Line, consisting
1929   of the protocol version followed by a numeric status code and its
1930   associated textual phrase, with each element separated by SP
1931   characters. No CR or LF is allowed except in the final CRLF sequence.
1932</t>
1933<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Status-Line"/>
1934  <x:ref>Status-Line</x:ref> = <x:ref>HTTP-Version</x:ref> <x:ref>SP</x:ref> <x:ref>Status-Code</x:ref> <x:ref>SP</x:ref> <x:ref>Reason-Phrase</x:ref> <x:ref>CRLF</x:ref>
1935</artwork></figure>
1936
1937<section title="Status Code and Reason Phrase" anchor="status.code.and.reason.phrase">
1938  <x:anchor-alias value="Reason-Phrase"/>
1939  <x:anchor-alias value="Status-Code"/>
1940<t>
1941   The Status-Code element is a 3-digit integer result code of the
1942   attempt to understand and satisfy the request. These codes are fully
1943   defined in &status-codes;.  The Reason Phrase exists for the sole
1944   purpose of providing a textual description associated with the numeric
1945   status code, out of deference to earlier Internet application protocols
1946   that were more frequently used with interactive text clients.
1947   A client &SHOULD; ignore the content of the Reason Phrase.
1948</t>
1949<t>
1950   The first digit of the Status-Code defines the class of response. The
1951   last two digits do not have any categorization role. There are 5
1952   values for the first digit:
1953  <list style="symbols">
1954    <t>
1955      1xx: Informational - Request received, continuing process
1956    </t>
1957    <t>
1958      2xx: Success - The action was successfully received,
1959        understood, and accepted
1960    </t>
1961    <t>
1962      3xx: Redirection - Further action must be taken in order to
1963        complete the request
1964    </t>
1965    <t>
1966      4xx: Client Error - The request contains bad syntax or cannot
1967        be fulfilled
1968    </t>
1969    <t>
1970      5xx: Server Error - The server failed to fulfill an apparently
1971        valid request
1972    </t>
1973  </list>
1974</t>
1975<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Status-Code"/><iref primary="true" item="Grammar" subitem="extension-code"/><iref primary="true" item="Grammar" subitem="Reason-Phrase"/>
1976  <x:ref>Status-Code</x:ref>    = 3<x:ref>DIGIT</x:ref>
1977  <x:ref>Reason-Phrase</x:ref>  = *&lt;<x:ref>TEXT</x:ref>, excluding <x:ref>CR</x:ref>, <x:ref>LF</x:ref>&gt;
1978</artwork></figure>
1979</section>
1980</section>
1981
1982</section>
1983
1984
1985<section title="Connections" anchor="connections">
1986
1987<section title="Persistent Connections" anchor="persistent.connections">
1988
1989<section title="Purpose" anchor="persistent.purpose">
1990<t>
1991   Prior to persistent connections, a separate TCP connection was
1992   established to fetch each URL, increasing the load on HTTP servers
1993   and causing congestion on the Internet. The use of inline images and
1994   other associated data often require a client to make multiple
1995   requests of the same server in a short amount of time. Analysis of
1996   these performance problems and results from a prototype
1997   implementation are available <xref target="Pad1995"/> <xref target="Spe"/>. Implementation experience and
1998   measurements of actual HTTP/1.1 (<xref target="RFC2068" x:fmt="none">RFC 2068</xref>) implementations show good
1999   results <xref target="Nie1997"/>. Alternatives have also been explored, for example,
2000   T/TCP <xref target="Tou1998"/>.
2001</t>
2002<t>
2003   Persistent HTTP connections have a number of advantages:
2004  <list style="symbols">
2005      <t>
2006        By opening and closing fewer TCP connections, CPU time is saved
2007        in routers and hosts (clients, servers, proxies, gateways,
2008        tunnels, or caches), and memory used for TCP protocol control
2009        blocks can be saved in hosts.
2010      </t>
2011      <t>
2012        HTTP requests and responses can be pipelined on a connection.
2013        Pipelining allows a client to make multiple requests without
2014        waiting for each response, allowing a single TCP connection to
2015        be used much more efficiently, with much lower elapsed time.
2016      </t>
2017      <t>
2018        Network congestion is reduced by reducing the number of packets
2019        caused by TCP opens, and by allowing TCP sufficient time to
2020        determine the congestion state of the network.
2021      </t>
2022      <t>
2023        Latency on subsequent requests is reduced since there is no time
2024        spent in TCP's connection opening handshake.
2025      </t>
2026      <t>
2027        HTTP can evolve more gracefully, since errors can be reported
2028        without the penalty of closing the TCP connection. Clients using
2029        future versions of HTTP might optimistically try a new feature,
2030        but if communicating with an older server, retry with old
2031        semantics after an error is reported.
2032      </t>
2033    </list>
2034</t>
2035<t>
2036   HTTP implementations &SHOULD; implement persistent connections.
2037</t>
2038</section>
2039
2040<section title="Overall Operation" anchor="persistent.overall">
2041<t>
2042   A significant difference between HTTP/1.1 and earlier versions of
2043   HTTP is that persistent connections are the default behavior of any
2044   HTTP connection. That is, unless otherwise indicated, the client
2045   &SHOULD; assume that the server will maintain a persistent connection,
2046   even after error responses from the server.
2047</t>
2048<t>
2049   Persistent connections provide a mechanism by which a client and a
2050   server can signal the close of a TCP connection. This signaling takes
2051   place using the Connection header field (<xref target="header.connection"/>). Once a close
2052   has been signaled, the client &MUST-NOT; send any more requests on that
2053   connection.
2054</t>
2055
2056<section title="Negotiation" anchor="persistent.negotiation">
2057<t>
2058   An HTTP/1.1 server &MAY; assume that a HTTP/1.1 client intends to
2059   maintain a persistent connection unless a Connection header including
2060   the connection-token "close" was sent in the request. If the server
2061   chooses to close the connection immediately after sending the
2062   response, it &SHOULD; send a Connection header including the
2063   connection-token close.
2064</t>
2065<t>
2066   An HTTP/1.1 client &MAY; expect a connection to remain open, but would
2067   decide to keep it open based on whether the response from a server
2068   contains a Connection header with the connection-token close. In case
2069   the client does not want to maintain a connection for more than that
2070   request, it &SHOULD; send a Connection header including the
2071   connection-token close.
2072</t>
2073<t>
2074   If either the client or the server sends the close token in the
2075   Connection header, that request becomes the last one for the
2076   connection.
2077</t>
2078<t>
2079   Clients and servers &SHOULD-NOT;  assume that a persistent connection is
2080   maintained for HTTP versions less than 1.1 unless it is explicitly
2081   signaled. See <xref target="compatibility.with.http.1.0.persistent.connections"/> for more information on backward
2082   compatibility with HTTP/1.0 clients.
2083</t>
2084<t>
2085   In order to remain persistent, all messages on the connection &MUST;
2086   have a self-defined message length (i.e., one not defined by closure
2087   of the connection), as described in <xref target="message.length"/>.
2088</t>
2089</section>
2090
2091<section title="Pipelining" anchor="pipelining">
2092<t>
2093   A client that supports persistent connections &MAY; "pipeline" its
2094   requests (i.e., send multiple requests without waiting for each
2095   response). A server &MUST; send its responses to those requests in the
2096   same order that the requests were received.
2097</t>
2098<t>
2099   Clients which assume persistent connections and pipeline immediately
2100   after connection establishment &SHOULD; be prepared to retry their
2101   connection if the first pipelined attempt fails. If a client does
2102   such a retry, it &MUST-NOT; pipeline before it knows the connection is
2103   persistent. Clients &MUST; also be prepared to resend their requests if
2104   the server closes the connection before sending all of the
2105   corresponding responses.
2106</t>
2107<t>
2108   Clients &SHOULD-NOT;  pipeline requests using non-idempotent methods or
2109   non-idempotent sequences of methods (see &idempotent-methods;). Otherwise, a
2110   premature termination of the transport connection could lead to
2111   indeterminate results. A client wishing to send a non-idempotent
2112   request &SHOULD; wait to send that request until it has received the
2113   response status for the previous request.
2114</t>
2115</section>
2116</section>
2117
2118<section title="Proxy Servers" anchor="persistent.proxy">
2119<t>
2120   It is especially important that proxies correctly implement the
2121   properties of the Connection header field as specified in <xref target="header.connection"/>.
2122</t>
2123<t>
2124   The proxy server &MUST; signal persistent connections separately with
2125   its clients and the origin servers (or other proxy servers) that it
2126   connects to. Each persistent connection applies to only one transport
2127   link.
2128</t>
2129<t>
2130   A proxy server &MUST-NOT; establish a HTTP/1.1 persistent connection
2131   with an HTTP/1.0 client (but see <xref target="RFC2068"/> for information and
2132   discussion of the problems with the Keep-Alive header implemented by
2133   many HTTP/1.0 clients).
2134</t>
2135</section>
2136
2137<section title="Practical Considerations" anchor="persistent.practical">
2138<t>
2139   Servers will usually have some time-out value beyond which they will
2140   no longer maintain an inactive connection. Proxy servers might make
2141   this a higher value since it is likely that the client will be making
2142   more connections through the same server. The use of persistent
2143   connections places no requirements on the length (or existence) of
2144   this time-out for either the client or the server.
2145</t>
2146<t>
2147   When a client or server wishes to time-out it &SHOULD; issue a graceful
2148   close on the transport connection. Clients and servers &SHOULD; both
2149   constantly watch for the other side of the transport close, and
2150   respond to it as appropriate. If a client or server does not detect
2151   the other side's close promptly it could cause unnecessary resource
2152   drain on the network.
2153</t>
2154<t>
2155   A client, server, or proxy &MAY; close the transport connection at any
2156   time. For example, a client might have started to send a new request
2157   at the same time that the server has decided to close the "idle"
2158   connection. From the server's point of view, the connection is being
2159   closed while it was idle, but from the client's point of view, a
2160   request is in progress.
2161</t>
2162<t>
2163   This means that clients, servers, and proxies &MUST; be able to recover
2164   from asynchronous close events. Client software &SHOULD; reopen the
2165   transport connection and retransmit the aborted sequence of requests
2166   without user interaction so long as the request sequence is
2167   idempotent (see &idempotent-methods;). Non-idempotent methods or sequences
2168   &MUST-NOT; be automatically retried, although user agents &MAY; offer a
2169   human operator the choice of retrying the request(s). Confirmation by
2170   user-agent software with semantic understanding of the application
2171   &MAY; substitute for user confirmation. The automatic retry &SHOULD-NOT; 
2172   be repeated if the second sequence of requests fails.
2173</t>
2174<t>
2175   Servers &SHOULD; always respond to at least one request per connection,
2176   if at all possible. Servers &SHOULD-NOT;  close a connection in the
2177   middle of transmitting a response, unless a network or client failure
2178   is suspected.
2179</t>
2180<t>
2181   Clients that use persistent connections &SHOULD; limit the number of
2182   simultaneous connections that they maintain to a given server. A
2183   single-user client &SHOULD-NOT; maintain more than 2 connections with
2184   any server or proxy. A proxy &SHOULD; use up to 2*N connections to
2185   another server or proxy, where N is the number of simultaneously
2186   active users. These guidelines are intended to improve HTTP response
2187   times and avoid congestion.
2188</t>
2189</section>
2190</section>
2191
2192<section title="Message Transmission Requirements" anchor="message.transmission.requirements">
2193
2194<section title="Persistent Connections and Flow Control" anchor="persistent.flow">
2195<t>
2196   HTTP/1.1 servers &SHOULD; maintain persistent connections and use TCP's
2197   flow control mechanisms to resolve temporary overloads, rather than
2198   terminating connections with the expectation that clients will retry.
2199   The latter technique can exacerbate network congestion.
2200</t>
2201</section>
2202
2203<section title="Monitoring Connections for Error Status Messages" anchor="persistent.monitor">
2204<t>
2205   An HTTP/1.1 (or later) client sending a message-body &SHOULD; monitor
2206   the network connection for an error status while it is transmitting
2207   the request. If the client sees an error status, it &SHOULD;
2208   immediately cease transmitting the body. If the body is being sent
2209   using a "chunked" encoding (<xref target="transfer.codings"/>), a zero length chunk and
2210   empty trailer &MAY; be used to prematurely mark the end of the message.
2211   If the body was preceded by a Content-Length header, the client &MUST;
2212   close the connection.
2213</t>
2214</section>
2215
2216<section title="Use of the 100 (Continue) Status" anchor="use.of.the.100.status">
2217<t>
2218   The purpose of the 100 (Continue) status (see &status-100;) is to
2219   allow a client that is sending a request message with a request body
2220   to determine if the origin server is willing to accept the request
2221   (based on the request headers) before the client sends the request
2222   body. In some cases, it might either be inappropriate or highly
2223   inefficient for the client to send the body if the server will reject
2224   the message without looking at the body.
2225</t>
2226<t>
2227   Requirements for HTTP/1.1 clients:
2228  <list style="symbols">
2229    <t>
2230        If a client will wait for a 100 (Continue) response before
2231        sending the request body, it &MUST; send an Expect request-header
2232        field (&header-expect;) with the "100-continue" expectation.
2233    </t>
2234    <t>
2235        A client &MUST-NOT; send an Expect request-header field (&header-expect;)
2236        with the "100-continue" expectation if it does not intend
2237        to send a request body.
2238    </t>
2239  </list>
2240</t>
2241<t>
2242   Because of the presence of older implementations, the protocol allows
2243   ambiguous situations in which a client may send "Expect: 100-continue"
2244   without receiving either a 417 (Expectation Failed) status
2245   or a 100 (Continue) status. Therefore, when a client sends this
2246   header field to an origin server (possibly via a proxy) from which it
2247   has never seen a 100 (Continue) status, the client &SHOULD-NOT;  wait
2248   for an indefinite period before sending the request body.
2249</t>
2250<t>
2251   Requirements for HTTP/1.1 origin servers:
2252  <list style="symbols">
2253    <t> Upon receiving a request which includes an Expect request-header
2254        field with the "100-continue" expectation, an origin server &MUST;
2255        either respond with 100 (Continue) status and continue to read
2256        from the input stream, or respond with a final status code. The
2257        origin server &MUST-NOT; wait for the request body before sending
2258        the 100 (Continue) response. If it responds with a final status
2259        code, it &MAY; close the transport connection or it &MAY; continue
2260        to read and discard the rest of the request.  It &MUST-NOT;
2261        perform the requested method if it returns a final status code.
2262    </t>
2263    <t> An origin server &SHOULD-NOT;  send a 100 (Continue) response if
2264        the request message does not include an Expect request-header
2265        field with the "100-continue" expectation, and &MUST-NOT; send a
2266        100 (Continue) response if such a request comes from an HTTP/1.0
2267        (or earlier) client. There is an exception to this rule: for
2268        compatibility with <xref target="RFC2068"/>, a server &MAY; send a 100 (Continue)
2269        status in response to an HTTP/1.1 PUT or POST request that does
2270        not include an Expect request-header field with the "100-continue"
2271        expectation. This exception, the purpose of which is
2272        to minimize any client processing delays associated with an
2273        undeclared wait for 100 (Continue) status, applies only to
2274        HTTP/1.1 requests, and not to requests with any other HTTP-version
2275        value.
2276    </t>
2277    <t> An origin server &MAY; omit a 100 (Continue) response if it has
2278        already received some or all of the request body for the
2279        corresponding request.
2280    </t>
2281    <t> An origin server that sends a 100 (Continue) response &MUST;
2282    ultimately send a final status code, once the request body is
2283        received and processed, unless it terminates the transport
2284        connection prematurely.
2285    </t>
2286    <t> If an origin server receives a request that does not include an
2287        Expect request-header field with the "100-continue" expectation,
2288        the request includes a request body, and the server responds
2289        with a final status code before reading the entire request body
2290        from the transport connection, then the server &SHOULD-NOT;  close
2291        the transport connection until it has read the entire request,
2292        or until the client closes the connection. Otherwise, the client
2293        might not reliably receive the response message. However, this
2294        requirement is not be construed as preventing a server from
2295        defending itself against denial-of-service attacks, or from
2296        badly broken client implementations.
2297      </t>
2298    </list>
2299</t>
2300<t>
2301   Requirements for HTTP/1.1 proxies:
2302  <list style="symbols">
2303    <t> If a proxy receives a request that includes an Expect request-header
2304        field with the "100-continue" expectation, and the proxy
2305        either knows that the next-hop server complies with HTTP/1.1 or
2306        higher, or does not know the HTTP version of the next-hop
2307        server, it &MUST; forward the request, including the Expect header
2308        field.
2309    </t>
2310    <t> If the proxy knows that the version of the next-hop server is
2311        HTTP/1.0 or lower, it &MUST-NOT; forward the request, and it &MUST;
2312        respond with a 417 (Expectation Failed) status.
2313    </t>
2314    <t> Proxies &SHOULD; maintain a cache recording the HTTP version
2315        numbers received from recently-referenced next-hop servers.
2316    </t>
2317    <t> A proxy &MUST-NOT; forward a 100 (Continue) response if the
2318        request message was received from an HTTP/1.0 (or earlier)
2319        client and did not include an Expect request-header field with
2320        the "100-continue" expectation. This requirement overrides the
2321        general rule for forwarding of 1xx responses (see &status-1xx;).
2322    </t>
2323  </list>
2324</t>
2325</section>
2326
2327<section title="Client Behavior if Server Prematurely Closes Connection" anchor="connection.premature">
2328<t>
2329   If an HTTP/1.1 client sends a request which includes a request body,
2330   but which does not include an Expect request-header field with the
2331   "100-continue" expectation, and if the client is not directly
2332   connected to an HTTP/1.1 origin server, and if the client sees the
2333   connection close before receiving any status from the server, the
2334   client &SHOULD; retry the request.  If the client does retry this
2335   request, it &MAY; use the following "binary exponential backoff"
2336   algorithm to be assured of obtaining a reliable response:
2337  <list style="numbers">
2338    <t>
2339      Initiate a new connection to the server
2340    </t>
2341    <t>
2342      Transmit the request-headers
2343    </t>
2344    <t>
2345      Initialize a variable R to the estimated round-trip time to the
2346         server (e.g., based on the time it took to establish the
2347         connection), or to a constant value of 5 seconds if the round-trip
2348         time is not available.
2349    </t>
2350    <t>
2351       Compute T = R * (2**N), where N is the number of previous
2352         retries of this request.
2353    </t>
2354    <t>
2355       Wait either for an error response from the server, or for T
2356         seconds (whichever comes first)
2357    </t>
2358    <t>
2359       If no error response is received, after T seconds transmit the
2360         body of the request.
2361    </t>
2362    <t>
2363       If client sees that the connection is closed prematurely,
2364         repeat from step 1 until the request is accepted, an error
2365         response is received, or the user becomes impatient and
2366         terminates the retry process.
2367    </t>
2368  </list>
2369</t>
2370<t>
2371   If at any point an error status is received, the client
2372  <list style="symbols">
2373      <t>&SHOULD-NOT;  continue and</t>
2374
2375      <t>&SHOULD; close the connection if it has not completed sending the
2376        request message.</t>
2377    </list>
2378</t>
2379</section>
2380</section>
2381</section>
2382
2383
2384<section title="Header Field Definitions" anchor="header.fields">
2385<t>
2386   This section defines the syntax and semantics of HTTP/1.1 header fields
2387   related to message framing and transport protocols.
2388</t>
2389<t>
2390   For entity-header fields, both sender and recipient refer to either the
2391   client or the server, depending on who sends and who receives the entity.
2392</t>
2393
2394<section title="Connection" anchor="header.connection">
2395  <iref primary="true" item="Connection header" x:for-anchor=""/>
2396  <iref primary="true" item="Headers" subitem="Connection" x:for-anchor=""/>
2397  <x:anchor-alias value="Connection"/>
2398  <x:anchor-alias value="connection-token"/>
2399<t>
2400   The Connection general-header field allows the sender to specify
2401   options that are desired for that particular connection and &MUST-NOT;
2402   be communicated by proxies over further connections.
2403</t>
2404<t>
2405   The Connection header has the following grammar:
2406</t>
2407<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Connection"/><iref primary="true" item="Grammar" subitem="connection-token"/>
2408  <x:ref>Connection</x:ref> = "Connection" ":" 1#(<x:ref>connection-token</x:ref>)
2409  <x:ref>connection-token</x:ref>  = <x:ref>token</x:ref>
2410</artwork></figure>
2411<t>
2412   HTTP/1.1 proxies &MUST; parse the Connection header field before a
2413   message is forwarded and, for each connection-token in this field,
2414   remove any header field(s) from the message with the same name as the
2415   connection-token. Connection options are signaled by the presence of
2416   a connection-token in the Connection header field, not by any
2417   corresponding additional header field(s), since the additional header
2418   field may not be sent if there are no parameters associated with that
2419   connection option.
2420</t>
2421<t>
2422   Message headers listed in the Connection header &MUST-NOT; include
2423   end-to-end headers, such as Cache-Control.
2424</t>
2425<t>
2426   HTTP/1.1 defines the "close" connection option for the sender to
2427   signal that the connection will be closed after completion of the
2428   response. For example,
2429</t>
2430<figure><artwork type="example">
2431    Connection: close
2432</artwork></figure>
2433<t>
2434   in either the request or the response header fields indicates that
2435   the connection &SHOULD-NOT;  be considered `persistent' (<xref target="persistent.connections"/>)
2436   after the current request/response is complete.
2437</t>
2438<t>
2439   An HTTP/1.1 client that does not support persistent connections &MUST;
2440   include the "close" connection option in every request message.
2441</t>
2442<t>
2443   An HTTP/1.1 server that does not support persistent connections &MUST;
2444   include the "close" connection option in every response message that
2445   does not have a 1xx (informational) status code.
2446</t>
2447<t>
2448   A system receiving an HTTP/1.0 (or lower-version) message that
2449   includes a Connection header &MUST;, for each connection-token in this
2450   field, remove and ignore any header field(s) from the message with
2451   the same name as the connection-token. This protects against mistaken
2452   forwarding of such header fields by pre-HTTP/1.1 proxies. See <xref target="compatibility.with.http.1.0.persistent.connections"/>.
2453</t>
2454</section>
2455
2456<section title="Content-Length" anchor="header.content-length">
2457  <iref primary="true" item="Content-Length header" x:for-anchor=""/>
2458  <iref primary="true" item="Headers" subitem="Content-Length" x:for-anchor=""/>
2459  <x:anchor-alias value="Content-Length"/>
2460<t>
2461   The Content-Length entity-header field indicates the size of the
2462   entity-body, in decimal number of OCTETs, sent to the recipient or,
2463   in the case of the HEAD method, the size of the entity-body that
2464   would have been sent had the request been a GET.
2465</t>
2466<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Content-Length"/>
2467  <x:ref>Content-Length</x:ref>    = "Content-Length" ":" 1*<x:ref>DIGIT</x:ref>
2468</artwork></figure>
2469<t>
2470   An example is
2471</t>
2472<figure><artwork type="example">
2473    Content-Length: 3495
2474</artwork></figure>
2475<t>
2476   Applications &SHOULD; use this field to indicate the transfer-length of
2477   the message-body, unless this is prohibited by the rules in <xref target="message.length"/>.
2478</t>
2479<t>
2480   Any Content-Length greater than or equal to zero is a valid value.
2481   <xref target="message.length"/> describes how to determine the length of a message-body
2482   if a Content-Length is not given.
2483</t>
2484<t>
2485   Note that the meaning of this field is significantly different from
2486   the corresponding definition in MIME, where it is an optional field
2487   used within the "message/external-body" content-type. In HTTP, it
2488   &SHOULD; be sent whenever the message's length can be determined prior
2489   to being transferred, unless this is prohibited by the rules in
2490   <xref target="message.length"/>.
2491</t>
2492</section>
2493
2494<section title="Date" anchor="header.date">
2495  <iref primary="true" item="Date header" x:for-anchor=""/>
2496  <iref primary="true" item="Headers" subitem="Date" x:for-anchor=""/>
2497  <x:anchor-alias value="Date"/>
2498<t>
2499   The Date general-header field represents the date and time at which
2500   the message was originated, having the same semantics as orig-date in
2501   <xref target="RFC2822" x:fmt="of" x:sec="3.6.1"/>. The field value is an HTTP-date, as described in <xref target="full.date"/>;
2502   it &MUST; be sent in rfc1123-date format.
2503</t>
2504<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Date"/>
2505  <x:ref>Date</x:ref>  = "Date" ":" <x:ref>HTTP-date</x:ref>
2506</artwork></figure>
2507<t>
2508   An example is
2509</t>
2510<figure><artwork type="example">
2511    Date: Tue, 15 Nov 1994 08:12:31 GMT
2512</artwork></figure>
2513<t>
2514   Origin servers &MUST; include a Date header field in all responses,
2515   except in these cases:
2516  <list style="numbers">
2517      <t>If the response status code is 100 (Continue) or 101 (Switching
2518         Protocols), the response &MAY; include a Date header field, at
2519         the server's option.</t>
2520
2521      <t>If the response status code conveys a server error, e.g. 500
2522         (Internal Server Error) or 503 (Service Unavailable), and it is
2523         inconvenient or impossible to generate a valid Date.</t>
2524
2525      <t>If the server does not have a clock that can provide a
2526         reasonable approximation of the current time, its responses
2527         &MUST-NOT; include a Date header field. In this case, the rules
2528         in <xref target="clockless.origin.server.operation"/> &MUST; be followed.</t>
2529  </list>
2530</t>
2531<t>
2532   A received message that does not have a Date header field &MUST; be
2533   assigned one by the recipient if the message will be cached by that
2534   recipient or gatewayed via a protocol which requires a Date. An HTTP
2535   implementation without a clock &MUST-NOT; cache responses without
2536   revalidating them on every use. An HTTP cache, especially a shared
2537   cache, &SHOULD; use a mechanism, such as NTP <xref target="RFC1305"/>, to synchronize its
2538   clock with a reliable external standard.
2539</t>
2540<t>
2541   Clients &SHOULD; only send a Date header field in messages that include
2542   an entity-body, as in the case of the PUT and POST requests, and even
2543   then it is optional. A client without a clock &MUST-NOT; send a Date
2544   header field in a request.
2545</t>
2546<t>
2547   The HTTP-date sent in a Date header &SHOULD-NOT;  represent a date and
2548   time subsequent to the generation of the message. It &SHOULD; represent
2549   the best available approximation of the date and time of message
2550   generation, unless the implementation has no means of generating a
2551   reasonably accurate date and time. In theory, the date ought to
2552   represent the moment just before the entity is generated. In
2553   practice, the date can be generated at any time during the message
2554   origination without affecting its semantic value.
2555</t>
2556
2557<section title="Clockless Origin Server Operation" anchor="clockless.origin.server.operation">
2558<t>
2559   Some origin server implementations might not have a clock available.
2560   An origin server without a clock &MUST-NOT; assign Expires or Last-Modified
2561   values to a response, unless these values were associated
2562   with the resource by a system or user with a reliable clock. It &MAY;
2563   assign an Expires value that is known, at or before server
2564   configuration time, to be in the past (this allows "pre-expiration"
2565   of responses without storing separate Expires values for each
2566   resource).
2567</t>
2568</section>
2569</section>
2570
2571<section title="Host" anchor="header.host">
2572  <iref primary="true" item="Host header" x:for-anchor=""/>
2573  <iref primary="true" item="Headers" subitem="Host" x:for-anchor=""/>
2574  <x:anchor-alias value="Host"/>
2575<t>
2576   The Host request-header field specifies the Internet host and port
2577   number of the resource being requested, as obtained from the original
2578   URI given by the user or referring resource (generally an HTTP URL,
2579   as described in <xref target="http.url"/>). The Host field value &MUST; represent
2580   the naming authority of the origin server or gateway given by the
2581   original URL. This allows the origin server or gateway to
2582   differentiate between internally-ambiguous URLs, such as the root "/"
2583   URL of a server for multiple host names on a single IP address.
2584</t>
2585<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Host"/>
2586  <x:ref>Host</x:ref> = "Host" ":" <x:ref>uri-host</x:ref> [ ":" <x:ref>port</x:ref> ] ; <xref target="http.url"/>
2587</artwork></figure>
2588<t>
2589   A "host" without any trailing port information implies the default
2590   port for the service requested (e.g., "80" for an HTTP URL). For
2591   example, a request on the origin server for
2592   &lt;http://www.example.org/pub/WWW/&gt; would properly include:
2593</t>
2594<figure><artwork type="example">
2595    GET /pub/WWW/ HTTP/1.1
2596    Host: www.example.org
2597</artwork></figure>
2598<t>
2599   A client &MUST; include a Host header field in all HTTP/1.1 request
2600   messages. If the requested URI does not include an Internet host
2601   name for the service being requested, then the Host header field &MUST;
2602   be given with an empty value. An HTTP/1.1 proxy &MUST; ensure that any
2603   request message it forwards does contain an appropriate Host header
2604   field that identifies the service being requested by the proxy. All
2605   Internet-based HTTP/1.1 servers &MUST; respond with a 400 (Bad Request)
2606   status code to any HTTP/1.1 request message which lacks a Host header
2607   field.
2608</t>
2609<t>
2610   See Sections <xref target="the.resource.identified.by.a.request" format="counter"/>
2611   and <xref target="changes.to.simplify.multi-homed.web.servers.and.conserve.ip.addresses" format="counter"/>
2612   for other requirements relating to Host.
2613</t>
2614</section>
2615
2616<section title="TE" anchor="header.te">
2617  <iref primary="true" item="TE header" x:for-anchor=""/>
2618  <iref primary="true" item="Headers" subitem="TE" x:for-anchor=""/>
2619  <x:anchor-alias value="TE"/>
2620  <x:anchor-alias value="t-codings"/>
2621<t>
2622   The TE request-header field indicates what extension transfer-codings
2623   it is willing to accept in the response and whether or not it is
2624   willing to accept trailer fields in a chunked transfer-coding. Its
2625   value may consist of the keyword "trailers" and/or a comma-separated
2626   list of extension transfer-coding names with optional accept
2627   parameters (as described in <xref target="transfer.codings"/>).
2628</t>
2629<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="TE"/><iref primary="true" item="Grammar" subitem="t-codings"/>
2630  <x:ref>TE</x:ref>        = "TE" ":" #( <x:ref>t-codings</x:ref> )
2631  <x:ref>t-codings</x:ref> = "trailers" | ( <x:ref>transfer-extension</x:ref> [ <x:ref>accept-params</x:ref> ] )
2632</artwork></figure>
2633<t>
2634   The presence of the keyword "trailers" indicates that the client is
2635   willing to accept trailer fields in a chunked transfer-coding, as
2636   defined in <xref target="chunked.transfer.encoding"/>. This keyword is reserved for use with
2637   transfer-coding values even though it does not itself represent a
2638   transfer-coding.
2639</t>
2640<t>
2641   Examples of its use are:
2642</t>
2643<figure><artwork type="example">
2644    TE: deflate
2645    TE:
2646    TE: trailers, deflate;q=0.5
2647</artwork></figure>
2648<t>
2649   The TE header field only applies to the immediate connection.
2650   Therefore, the keyword &MUST; be supplied within a Connection header
2651   field (<xref target="header.connection"/>) whenever TE is present in an HTTP/1.1 message.
2652</t>
2653<t>
2654   A server tests whether a transfer-coding is acceptable, according to
2655   a TE field, using these rules:
2656  <list style="numbers">
2657    <x:lt>
2658      <t>The "chunked" transfer-coding is always acceptable. If the
2659         keyword "trailers" is listed, the client indicates that it is
2660         willing to accept trailer fields in the chunked response on
2661         behalf of itself and any downstream clients. The implication is
2662         that, if given, the client is stating that either all
2663         downstream clients are willing to accept trailer fields in the
2664         forwarded response, or that it will attempt to buffer the
2665         response on behalf of downstream recipients.
2666      </t><t>
2667         <x:h>Note:</x:h> HTTP/1.1 does not define any means to limit the size of a
2668         chunked response such that a client can be assured of buffering
2669         the entire response.</t>
2670    </x:lt>
2671    <x:lt>
2672      <t>If the transfer-coding being tested is one of the transfer-codings
2673         listed in the TE field, then it is acceptable unless it
2674         is accompanied by a qvalue of 0. (As defined in &qvalue;, a
2675         qvalue of 0 means "not acceptable.")</t>
2676    </x:lt>
2677    <x:lt>
2678      <t>If multiple transfer-codings are acceptable, then the
2679         acceptable transfer-coding with the highest non-zero qvalue is
2680         preferred.  The "chunked" transfer-coding always has a qvalue
2681         of 1.</t>
2682    </x:lt>
2683  </list>
2684</t>
2685<t>
2686   If the TE field-value is empty or if no TE field is present, the only
2687   transfer-coding  is "chunked". A message with no transfer-coding is
2688   always acceptable.
2689</t>
2690</section>
2691
2692<section title="Trailer" anchor="header.trailer">
2693  <iref primary="true" item="Trailer header" x:for-anchor=""/>
2694  <iref primary="true" item="Headers" subitem="Trailer" x:for-anchor=""/>
2695  <x:anchor-alias value="Trailer"/>
2696<t>
2697   The Trailer general field value indicates that the given set of
2698   header fields is present in the trailer of a message encoded with
2699   chunked transfer-coding.
2700</t>
2701<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Trailer"/>
2702  <x:ref>Trailer</x:ref>  = "Trailer" ":" 1#<x:ref>field-name</x:ref>
2703</artwork></figure>
2704<t>
2705   An HTTP/1.1 message &SHOULD; include a Trailer header field in a
2706   message using chunked transfer-coding with a non-empty trailer. Doing
2707   so allows the recipient to know which header fields to expect in the
2708   trailer.
2709</t>
2710<t>
2711   If no Trailer header field is present, the trailer &SHOULD-NOT;  include
2712   any header fields. See <xref target="chunked.transfer.encoding"/> for restrictions on the use of
2713   trailer fields in a "chunked" transfer-coding.
2714</t>
2715<t>
2716   Message header fields listed in the Trailer header field &MUST-NOT;
2717   include the following header fields:
2718  <list style="symbols">
2719    <t>Transfer-Encoding</t>
2720    <t>Content-Length</t>
2721    <t>Trailer</t>
2722  </list>
2723</t>
2724</section>
2725
2726<section title="Transfer-Encoding" anchor="header.transfer-encoding">
2727  <iref primary="true" item="Transfer-Encoding header" x:for-anchor=""/>
2728  <iref primary="true" item="Headers" subitem="Transfer-Encoding" x:for-anchor=""/>
2729  <x:anchor-alias value="Transfer-Encoding"/>
2730<t>
2731   The Transfer-Encoding general-header field indicates what (if any)
2732   type of transformation has been applied to the message body in order
2733   to safely transfer it between the sender and the recipient. This
2734   differs from the content-coding in that the transfer-coding is a
2735   property of the message, not of the entity.
2736</t>
2737<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Transfer-Encoding"/>
2738  <x:ref>Transfer-Encoding</x:ref>       = "Transfer-Encoding" ":" 1#<x:ref>transfer-coding</x:ref>
2739</artwork></figure>
2740<t>
2741   Transfer-codings are defined in <xref target="transfer.codings"/>. An example is:
2742</t>
2743<figure><artwork type="example">
2744  Transfer-Encoding: chunked
2745</artwork></figure>
2746<t>
2747   If multiple encodings have been applied to an entity, the transfer-codings
2748   &MUST; be listed in the order in which they were applied.
2749   Additional information about the encoding parameters &MAY; be provided
2750   by other entity-header fields not defined by this specification.
2751</t>
2752<t>
2753   Many older HTTP/1.0 applications do not understand the Transfer-Encoding
2754   header.
2755</t>
2756</section>
2757
2758<section title="Upgrade" anchor="header.upgrade">
2759  <iref primary="true" item="Upgrade header" x:for-anchor=""/>
2760  <iref primary="true" item="Headers" subitem="Upgrade" x:for-anchor=""/>
2761  <x:anchor-alias value="Upgrade"/>
2762<t>
2763   The Upgrade general-header allows the client to specify what
2764   additional communication protocols it supports and would like to use
2765   if the server finds it appropriate to switch protocols. The server
2766   &MUST; use the Upgrade header field within a 101 (Switching Protocols)
2767   response to indicate which protocol(s) are being switched.
2768</t>
2769<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Upgrade"/>
2770  <x:ref>Upgrade</x:ref>        = "Upgrade" ":" 1#<x:ref>product</x:ref>
2771</artwork></figure>
2772<t>
2773   For example,
2774</t>
2775<figure><artwork type="example">
2776    Upgrade: HTTP/2.0, SHTTP/1.3, IRC/6.9, RTA/x11
2777</artwork></figure>
2778<t>
2779   The Upgrade header field is intended to provide a simple mechanism
2780   for transition from HTTP/1.1 to some other, incompatible protocol. It
2781   does so by allowing the client to advertise its desire to use another
2782   protocol, such as a later version of HTTP with a higher major version
2783   number, even though the current request has been made using HTTP/1.1.
2784   This eases the difficult transition between incompatible protocols by
2785   allowing the client to initiate a request in the more commonly
2786   supported protocol while indicating to the server that it would like
2787   to use a "better" protocol if available (where "better" is determined
2788   by the server, possibly according to the nature of the method and/or
2789   resource being requested).
2790</t>
2791<t>
2792   The Upgrade header field only applies to switching application-layer
2793   protocols upon the existing transport-layer connection. Upgrade
2794   cannot be used to insist on a protocol change; its acceptance and use
2795   by the server is optional. The capabilities and nature of the
2796   application-layer communication after the protocol change is entirely
2797   dependent upon the new protocol chosen, although the first action
2798   after changing the protocol &MUST; be a response to the initial HTTP
2799   request containing the Upgrade header field.
2800</t>
2801<t>
2802   The Upgrade header field only applies to the immediate connection.
2803   Therefore, the upgrade keyword &MUST; be supplied within a Connection
2804   header field (<xref target="header.connection"/>) whenever Upgrade is present in an
2805   HTTP/1.1 message.
2806</t>
2807<t>
2808   The Upgrade header field cannot be used to indicate a switch to a
2809   protocol on a different connection. For that purpose, it is more
2810   appropriate to use a 301, 302, 303, or 305 redirection response.
2811</t>
2812<t>
2813   This specification only defines the protocol name "HTTP" for use by
2814   the family of Hypertext Transfer Protocols, as defined by the HTTP
2815   version rules of <xref target="http.version"/> and future updates to this
2816   specification. Any token can be used as a protocol name; however, it
2817   will only be useful if both the client and server associate the name
2818   with the same protocol.
2819</t>
2820</section>
2821
2822<section title="Via" anchor="header.via">
2823  <iref primary="true" item="Via header" x:for-anchor=""/>
2824  <iref primary="true" item="Headers" subitem="Via" x:for-anchor=""/>
2825  <x:anchor-alias value="protocol-name"/>
2826  <x:anchor-alias value="protocol-version"/>
2827  <x:anchor-alias value="pseudonym"/>
2828  <x:anchor-alias value="received-by"/>
2829  <x:anchor-alias value="received-protocol"/>
2830  <x:anchor-alias value="Via"/>
2831<t>
2832   The Via general-header field &MUST; be used by gateways and proxies to
2833   indicate the intermediate protocols and recipients between the user
2834   agent and the server on requests, and between the origin server and
2835   the client on responses. It is analogous to the "Received" field defined in
2836   <xref target="RFC2822" x:fmt="of" x:sec="3.6.7"/> and is intended to be used for tracking message forwards,
2837   avoiding request loops, and identifying the protocol capabilities of
2838   all senders along the request/response chain.
2839</t>
2840<figure><artwork type="abnf2616"><iref primary="true" item="Grammar" subitem="Via"/><iref primary="true" item="Grammar" subitem="received-protocol"/><iref primary="true" item="Grammar" subitem="protocol-name"/><iref primary="true" item="Grammar" subitem="protocol-version"/><iref primary="true" item="Grammar" subitem="received-by"/><iref primary="true" item="Grammar" subitem="pseudonym"/>
2841  <x:ref>Via</x:ref> =  "Via" ":" 1#( <x:ref>received-protocol</x:ref> <x:ref>received-by</x:ref> [ <x:ref>comment</x:ref> ] )
2842  <x:ref>received-protocol</x:ref> = [ <x:ref>protocol-name</x:ref> "/" ] <x:ref>protocol-version</x:ref>
2843  <x:ref>protocol-name</x:ref>     = <x:ref>token</x:ref>
2844  <x:ref>protocol-version</x:ref>  = <x:ref>token</x:ref>
2845  <x:ref>received-by</x:ref>       = ( <x:ref>uri-host</x:ref> [ ":" <x:ref>port</x:ref> ] ) | <x:ref>pseudonym</x:ref>
2846  <x:ref>pseudonym</x:ref>         = <x:ref>token</x:ref>
2847</artwork></figure>
2848<t>
2849   The received-protocol indicates the protocol version of the message
2850   received by the server or client along each segment of the
2851   request/response chain. The received-protocol version is appended to
2852   the Via field value when the message is forwarded so that information
2853   about the protocol capabilities of upstream applications remains
2854   visible to all recipients.
2855</t>
2856<t>
2857   The protocol-name is optional if and only if it would be "HTTP". The
2858   received-by field is normally the host and optional port number of a
2859   recipient server or client that subsequently forwarded the message.
2860   However, if the real host is considered to be sensitive information,
2861   it &MAY; be replaced by a pseudonym. If the port is not given, it &MAY;
2862   be assumed to be the default port of the received-protocol.
2863</t>
2864<t>
2865   Multiple Via field values represents each proxy or gateway that has
2866   forwarded the message. Each recipient &MUST; append its information
2867   such that the end result is ordered according to the sequence of
2868   forwarding applications.
2869</t>
2870<t>
2871   Comments &MAY; be used in the Via header field to identify the software
2872   of the recipient proxy or gateway, analogous to the User-Agent and
2873   Server header fields. However, all comments in the Via field are
2874   optional and &MAY; be removed by any recipient prior to forwarding the
2875   message.
2876</t>
2877<t>
2878   For example, a request message could be sent from an HTTP/1.0 user
2879   agent to an internal proxy code-named "fred", which uses HTTP/1.1 to
2880   forward the request to a public proxy at p.example.net, which completes
2881   the request by forwarding it to the origin server at www.example.com.
2882   The request received by www.example.com would then have the following
2883   Via header field:
2884</t>
2885<figure><artwork type="example">
2886    Via: 1.0 fred, 1.1 p.example.net (Apache/1.1)
2887</artwork></figure>
2888<t>
2889   Proxies and gateways used as a portal through a network firewall
2890   &SHOULD-NOT;, by default, forward the names and ports of hosts within
2891   the firewall region. This information &SHOULD; only be propagated if
2892   explicitly enabled. If not enabled, the received-by host of any host
2893   behind the firewall &SHOULD; be replaced by an appropriate pseudonym
2894   for that host.
2895</t>
2896<t>
2897   For organizations that have strong privacy requirements for hiding
2898   internal structures, a proxy &MAY; combine an ordered subsequence of
2899   Via header field entries with identical received-protocol values into
2900   a single such entry. For example,
2901</t>
2902<figure><artwork type="example">
2903    Via: 1.0 ricky, 1.1 ethel, 1.1 fred, 1.0 lucy
2904</artwork></figure>
2905<t>
2906        could be collapsed to
2907</t>
2908<figure><artwork type="example">
2909    Via: 1.0 ricky, 1.1 mertz, 1.0 lucy
2910</artwork></figure>
2911<t>
2912   Applications &SHOULD-NOT;  combine multiple entries unless they are all
2913   under the same organizational control and the hosts have already been
2914   replaced by pseudonyms. Applications &MUST-NOT; combine entries which
2915   have different received-protocol values.
2916</t>
2917</section>
2918
2919</section>
2920
2921<section title="IANA Considerations" anchor="IANA.considerations">
2922<section title="Message Header Registration" anchor="message.header.registration">
2923<!--AUTOGENERATED FROM extract-header-defs.xslt, do not edit manually-->
2924<!--(START)-->
2925<t>
2926    The Message Header Registry located at <eref target="http://www.iana.org/assignments/message-headers/message-header-index.html"/> should be updated
2927    with the permanent registrations below (see <xref target="RFC3864"/>):
2928</t>
2929<texttable>
2930   <ttcol>Header Field Name</ttcol>
2931   <ttcol>Protocol</ttcol>
2932   <ttcol>Status</ttcol>
2933   <ttcol>Reference</ttcol>
2934
2935   <c>Connection</c>
2936   <c>http</c>
2937   <c>standard</c>
2938   <c>
2939      <xref target="header.connection"/>
2940   </c>
2941
2942   <c>Content-Length</c>
2943   <c>http</c>
2944   <c>standard</c>
2945   <c>
2946      <xref target="header.content-length"/>
2947   </c>
2948
2949   <c>Date</c>
2950   <c>http</c>
2951   <c>standard</c>
2952   <c>
2953      <xref target="header.date"/>
2954   </c>
2955
2956   <c>Host</c>
2957   <c>http</c>
2958   <c>standard</c>
2959   <c>
2960      <xref target="header.host"/>
2961   </c>
2962
2963   <c>TE</c>
2964   <c>http</c>
2965   <c>standard</c>
2966   <c>
2967      <xref target="header.te"/>
2968   </c>
2969
2970   <c>Trailer</c>
2971   <c>http</c>
2972   <c>standard</c>
2973   <c>
2974      <xref target="header.trailer"/>
2975   </c>
2976
2977   <c>Transfer-Encoding</c>
2978   <c>http</c>
2979   <c>standard</c>
2980   <c>
2981      <xref target="header.transfer-encoding"/>
2982   </c>
2983
2984   <c>Upgrade</c>
2985   <c>http</c>
2986   <c>standard</c>
2987   <c>
2988      <xref target="header.upgrade"/>
2989   </c>
2990
2991   <c>Via</c>
2992   <c>http</c>
2993   <c>standard</c>
2994   <c>
2995      <xref target="header.via"/>
2996   </c>
2997</texttable>
2998<t>
2999    The change controller is: "IETF (iesg@ietf.org) - Internet Engineering Task Force".
3000</t>
3001<!--(END)-->
3002</section>
3003</section>
3004
3005<section title="Security Considerations" anchor="security.considerations">
3006<t>
3007   This section is meant to inform application developers, information
3008   providers, and users of the security limitations in HTTP/1.1 as
3009   described by this document. The discussion does not include
3010   definitive solutions to the problems revealed, though it does make
3011   some suggestions for reducing security risks.
3012</t>
3013
3014<section title="Personal Information" anchor="personal.information">
3015<t>
3016   HTTP clients are often privy to large amounts of personal information
3017   (e.g. the user's name, location, mail address, passwords, encryption
3018   keys, etc.), and &SHOULD; be very careful to prevent unintentional
3019   leakage of this information.
3020   We very strongly recommend that a convenient interface be provided
3021   for the user to control dissemination of such information, and that
3022   designers and implementors be particularly careful in this area.
3023   History shows that errors in this area often create serious security
3024   and/or privacy problems and generate highly adverse publicity for the
3025   implementor's company.
3026</t>
3027</section>
3028
3029<section title="Abuse of Server Log Information" anchor="abuse.of.server.log.information">
3030<t>
3031   A server is in the position to save personal data about a user's
3032   requests which might identify their reading patterns or subjects of
3033   interest. This information is clearly confidential in nature and its
3034   handling can be constrained by law in certain countries. People using
3035   HTTP to provide data are responsible for ensuring that
3036   such material is not distributed without the permission of any
3037   individuals that are identifiable by the published results.
3038</t>
3039</section>
3040
3041<section title="Attacks Based On File and Path Names" anchor="attack.pathname">
3042<t>
3043   Implementations of HTTP origin servers &SHOULD; be careful to restrict
3044   the documents returned by HTTP requests to be only those that were
3045   intended by the server administrators. If an HTTP server translates
3046   HTTP URIs directly into file system calls, the server &MUST; take
3047   special care not to serve files that were not intended to be
3048   delivered to HTTP clients. For example, UNIX, Microsoft Windows, and
3049   other operating systems use ".." as a path component to indicate a
3050   directory level above the current one. On such a system, an HTTP
3051   server &MUST; disallow any such construct in the Request-URI if it
3052   would otherwise allow access to a resource outside those intended to
3053   be accessible via the HTTP server. Similarly, files intended for
3054   reference only internally to the server (such as access control
3055   files, configuration files, and script code) &MUST; be protected from
3056   inappropriate retrieval, since they might contain sensitive
3057   information. Experience has shown that minor bugs in such HTTP server
3058   implementations have turned into security risks.
3059</t>
3060</section>
3061
3062<section title="DNS Spoofing" anchor="dns.spoofing">
3063<t>
3064   Clients using HTTP rely heavily on the Domain Name Service, and are
3065   thus generally prone to security attacks based on the deliberate
3066   mis-association of IP addresses and DNS names. Clients need to be
3067   cautious in assuming the continuing validity of an IP number/DNS name
3068   association.
3069</t>
3070<t>
3071   In particular, HTTP clients &SHOULD; rely on their name resolver for
3072   confirmation of an IP number/DNS name association, rather than
3073   caching the result of previous host name lookups. Many platforms
3074   already can cache host name lookups locally when appropriate, and
3075   they &SHOULD; be configured to do so. It is proper for these lookups to
3076   be cached, however, only when the TTL (Time To Live) information
3077   reported by the name server makes it likely that the cached
3078   information will remain useful.
3079</t>
3080<t>
3081   If HTTP clients cache the results of host name lookups in order to
3082   achieve a performance improvement, they &MUST; observe the TTL
3083   information reported by DNS.
3084</t>
3085<t>
3086   If HTTP clients do not observe this rule, they could be spoofed when
3087   a previously-accessed server's IP address changes. As network
3088   renumbering is expected to become increasingly common <xref target="RFC1900"/>, the
3089   possibility of this form of attack will grow. Observing this
3090   requirement thus reduces this potential security vulnerability.
3091</t>
3092<t>
3093   This requirement also improves the load-balancing behavior of clients
3094   for replicated servers using the same DNS name and reduces the
3095   likelihood of a user's experiencing failure in accessing sites which
3096   use that strategy.
3097</t>
3098</section>
3099
3100<section title="Proxies and Caching" anchor="attack.proxies">
3101<t>
3102   By their very nature, HTTP proxies are men-in-the-middle, and
3103   represent an opportunity for man-in-the-middle attacks. Compromise of
3104   the systems on which the proxies run can result in serious security
3105   and privacy problems. Proxies have access to security-related
3106   information, personal information about individual users and
3107   organizations, and proprietary information belonging to users and
3108   content providers. A compromised proxy, or a proxy implemented or
3109   configured without regard to security and privacy considerations,
3110   might be used in the commission of a wide range of potential attacks.
3111</t>
3112<t>
3113   Proxy operators should protect the systems on which proxies run as
3114   they would protect any system that contains or transports sensitive
3115   information. In particular, log information gathered at proxies often
3116   contains highly sensitive personal information, and/or information
3117   about organizations. Log information should be carefully guarded, and
3118   appropriate guidelines for use developed and followed. (<xref target="abuse.of.server.log.information"/>).
3119</t>
3120<t>
3121   Proxy implementors should consider the privacy and security
3122   implications of their design and coding decisions, and of the
3123   configuration options they provide to proxy operators (especially the
3124   default configuration).
3125</t>
3126<t>
3127   Users of a proxy need to be aware that they are no trustworthier than
3128   the people who run the proxy; HTTP itself cannot solve this problem.
3129</t>
3130<t>
3131   The judicious use of cryptography, when appropriate, may suffice to
3132   protect against a broad range of security and privacy attacks. Such
3133   cryptography is beyond the scope of the HTTP/1.1 specification.
3134</t>
3135</section>
3136
3137<section title="Denial of Service Attacks on Proxies" anchor="attack.DoS">
3138<t>
3139   They exist. They are hard to defend against. Research continues.
3140   Beware.
3141</t>
3142</section>
3143</section>
3144
3145<section title="Acknowledgments" anchor="ack">
3146<t>
3147   This specification makes heavy use of the augmented BNF and generic
3148   constructs defined by David H. Crocker for <xref target="RFC822ABNF"/>. Similarly, it
3149   reuses many of the definitions provided by Nathaniel Borenstein and
3150   Ned Freed for MIME <xref target="RFC2045"/>. We hope that their inclusion in this
3151   specification will help reduce past confusion over the relationship
3152   between HTTP and Internet mail message formats.
3153</t>
3154<t>
3155   HTTP has evolved considerably over the years. It has
3156   benefited from a large and active developer community--the many
3157   people who have participated on the www-talk mailing list--and it is
3158   that community which has been most responsible for the success of
3159   HTTP and of the World-Wide Web in general. Marc Andreessen, Robert
3160   Cailliau, Daniel W. Connolly, Bob Denny, John Franks, Jean-Francois
3161   Groff, Phillip M. Hallam-Baker, Hakon W. Lie, Ari Luotonen, Rob
3162   McCool, Lou Montulli, Dave Raggett, Tony Sanders, and Marc
3163   VanHeyningen deserve special recognition for their efforts in
3164   defining early aspects of the protocol.
3165</t>
3166<t>
3167   This document has benefited greatly from the comments of all those
3168   participating in the HTTP-WG. In addition to those already mentioned,
3169   the following individuals have contributed to this specification:
3170</t>
3171<t>
3172   Gary Adams, Harald Tveit Alvestrand, Keith Ball, Brian Behlendorf,
3173   Paul Burchard, Maurizio Codogno, Mike Cowlishaw, Roman Czyborra,
3174   Michael A. Dolan, Daniel DuBois, David J. Fiander, Alan Freier, Marc Hedlund, Greg Herlihy,
3175   Koen Holtman, Alex Hopmann, Bob Jernigan, Shel Kaphan, Rohit Khare,
3176   John Klensin, Martijn Koster, Alexei Kosut, David M. Kristol,
3177   Daniel LaLiberte, Ben Laurie, Paul J. Leach, Albert Lunde,
3178   John C. Mallery, Jean-Philippe Martin-Flatin, Mitra, David Morris,
3179   Gavin Nicol, Ross Patterson, Bill Perry, Jeffrey Perry, Scott Powers, Owen Rees,
3180   Luigi Rizzo, David Robinson, Marc Salomon, Rich Salz,
3181   Allan M. Schiffman, Jim Seidman, Chuck Shotton, Eric W. Sink,
3182   Simon E. Spero, Richard N. Taylor, Robert S. Thau,
3183   Bill (BearHeart) Weinman, Francois Yergeau, Mary Ellen Zurko,
3184   Josh Cohen.
3185</t>
3186<t>
3187   Thanks to the "cave men" of Palo Alto. You know who you are.
3188</t>
3189<t>
3190   Jim Gettys (the editor of <xref target="RFC2616"/>) wishes particularly
3191   to thank Roy Fielding, the editor of <xref target="RFC2068"/>, along
3192   with John Klensin, Jeff Mogul, Paul Leach, Dave Kristol, Koen
3193   Holtman, John Franks, Josh Cohen, Alex Hopmann, Scott Lawrence, and
3194   Larry Masinter for their help. And thanks go particularly to Jeff
3195   Mogul and Scott Lawrence for performing the "MUST/MAY/SHOULD" audit.
3196</t>
3197<t>
3198   The Apache Group, Anselm Baird-Smith, author of Jigsaw, and Henrik
3199   Frystyk implemented RFC 2068 early, and we wish to thank them for the
3200   discovery of many of the problems that this document attempts to
3201   rectify.
3202</t>
3203</section>
3204
3205</middle>
3206<back>
3207
3208<references title="Normative References">
3209
3210<reference anchor="ISO-8859-1">
3211  <front>
3212    <title>
3213     Information technology -- 8-bit single-byte coded graphic character sets -- Part 1: Latin alphabet No. 1
3214    </title>
3215    <author>
3216      <organization>International Organization for Standardization</organization>
3217    </author>
3218    <date year="1998"/>
3219  </front>
3220  <seriesInfo name="ISO/IEC" value="8859-1:1998"/>
3221</reference>
3222
3223<reference anchor="Part2">
3224  <front>
3225    <title abbrev="HTTP/1.1">HTTP/1.1, part 2: Message Semantics</title>
3226    <author initials="R." surname="Fielding" fullname="Roy T. Fielding" role="editor">
3227      <organization abbrev="Day Software">Day Software</organization>
3228      <address><email>fielding@gbiv.com</email></address>
3229    </author>
3230    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3231      <organization>One Laptop per Child</organization>
3232      <address><email>jg@laptop.org</email></address>
3233    </author>
3234    <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
3235      <organization abbrev="HP">Hewlett-Packard Company</organization>
3236      <address><email>JeffMogul@acm.org</email></address>
3237    </author>
3238    <author initials="H." surname="Frystyk" fullname="Henrik Frystyk Nielsen">
3239      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3240      <address><email>henrikn@microsoft.com</email></address>
3241    </author>
3242    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3243      <organization abbrev="Adobe Systems">Adobe Systems, Incorporated</organization>
3244      <address><email>LMM@acm.org</email></address>
3245    </author>
3246    <author initials="P." surname="Leach" fullname="Paul J. Leach">
3247      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3248      <address><email>paulle@microsoft.com</email></address>
3249    </author>
3250    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3251      <organization abbrev="W3C/MIT">World Wide Web Consortium</organization>
3252      <address><email>timbl@w3.org</email></address>
3253    </author>
3254    <author initials="Y." surname="Lafon" fullname="Yves Lafon" role="editor">
3255      <organization abbrev="W3C">World Wide Web Consortium</organization>
3256      <address><email>ylafon@w3.org</email></address>
3257    </author>
3258    <author initials="J. F." surname="Reschke" fullname="Julian F. Reschke" role="editor">
3259      <organization abbrev="greenbytes">greenbytes GmbH</organization>
3260      <address><email>julian.reschke@greenbytes.de</email></address>
3261    </author>
3262    <date month="&ID-MONTH;" year="&ID-YEAR;"/>
3263  </front>
3264  <seriesInfo name="Internet-Draft" value="draft-ietf-httpbis-p2-semantics-&ID-VERSION;"/>
3265  <x:source href="p2-semantics.xml" basename="p2-semantics"/>
3266</reference>
3267
3268<reference anchor="Part3">
3269  <front>
3270    <title abbrev="HTTP/1.1">HTTP/1.1, part 3: Message Payload and Content Negotiation</title>
3271    <author initials="R." surname="Fielding" fullname="Roy T. Fielding" role="editor">
3272      <organization abbrev="Day Software">Day Software</organization>
3273      <address><email>fielding@gbiv.com</email></address>
3274    </author>
3275    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3276      <organization>One Laptop per Child</organization>
3277      <address><email>jg@laptop.org</email></address>
3278    </author>
3279    <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
3280      <organization abbrev="HP">Hewlett-Packard Company</organization>
3281      <address><email>JeffMogul@acm.org</email></address>
3282    </author>
3283    <author initials="H." surname="Frystyk" fullname="Henrik Frystyk Nielsen">
3284      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3285      <address><email>henrikn@microsoft.com</email></address>
3286    </author>
3287    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3288      <organization abbrev="Adobe Systems">Adobe Systems, Incorporated</organization>
3289      <address><email>LMM@acm.org</email></address>
3290    </author>
3291    <author initials="P." surname="Leach" fullname="Paul J. Leach">
3292      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3293      <address><email>paulle@microsoft.com</email></address>
3294    </author>
3295    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3296      <organization abbrev="W3C/MIT">World Wide Web Consortium</organization>
3297      <address><email>timbl@w3.org</email></address>
3298    </author>
3299    <author initials="Y." surname="Lafon" fullname="Yves Lafon" role="editor">
3300      <organization abbrev="W3C">World Wide Web Consortium</organization>
3301      <address><email>ylafon@w3.org</email></address>
3302    </author>
3303    <author initials="J. F." surname="Reschke" fullname="Julian F. Reschke" role="editor">
3304      <organization abbrev="greenbytes">greenbytes GmbH</organization>
3305      <address><email>julian.reschke@greenbytes.de</email></address>
3306    </author>
3307    <date month="&ID-MONTH;" year="&ID-YEAR;"/>
3308  </front>
3309  <seriesInfo name="Internet-Draft" value="draft-ietf-httpbis-p3-payload-&ID-VERSION;"/>
3310  <x:source href="p3-payload.xml" basename="p3-payload"/>
3311</reference>
3312
3313<reference anchor="Part5">
3314  <front>
3315    <title abbrev="HTTP/1.1">HTTP/1.1, part 5: Range Requests and Partial Responses</title>
3316    <author initials="R." surname="Fielding" fullname="Roy T. Fielding" role="editor">
3317      <organization abbrev="Day Software">Day Software</organization>
3318      <address><email>fielding@gbiv.com</email></address>
3319    </author>
3320    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3321      <organization>One Laptop per Child</organization>
3322      <address><email>jg@laptop.org</email></address>
3323    </author>
3324    <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
3325      <organization abbrev="HP">Hewlett-Packard Company</organization>
3326      <address><email>JeffMogul@acm.org</email></address>
3327    </author>
3328    <author initials="H." surname="Frystyk" fullname="Henrik Frystyk Nielsen">
3329      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3330      <address><email>henrikn@microsoft.com</email></address>
3331    </author>
3332    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3333      <organization abbrev="Adobe Systems">Adobe Systems, Incorporated</organization>
3334      <address><email>LMM@acm.org</email></address>
3335    </author>
3336    <author initials="P." surname="Leach" fullname="Paul J. Leach">
3337      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3338      <address><email>paulle@microsoft.com</email></address>
3339    </author>
3340    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3341      <organization abbrev="W3C/MIT">World Wide Web Consortium</organization>
3342      <address><email>timbl@w3.org</email></address>
3343    </author>
3344    <author initials="Y." surname="Lafon" fullname="Yves Lafon" role="editor">
3345      <organization abbrev="W3C">World Wide Web Consortium</organization>
3346      <address><email>ylafon@w3.org</email></address>
3347    </author>
3348    <author initials="J. F." surname="Reschke" fullname="Julian F. Reschke" role="editor">
3349      <organization abbrev="greenbytes">greenbytes GmbH</organization>
3350      <address><email>julian.reschke@greenbytes.de</email></address>
3351    </author>
3352    <date month="&ID-MONTH;" year="&ID-YEAR;"/>
3353  </front>
3354  <seriesInfo name="Internet-Draft" value="draft-ietf-httpbis-p5-range-&ID-VERSION;"/>
3355  <x:source href="p5-range.xml" basename="p5-range"/>
3356</reference>
3357
3358<reference anchor="Part6">
3359  <front>
3360    <title abbrev="HTTP/1.1">HTTP/1.1, part 6: Caching</title>
3361    <author initials="R." surname="Fielding" fullname="Roy T. Fielding" role="editor">
3362      <organization abbrev="Day Software">Day Software</organization>
3363      <address><email>fielding@gbiv.com</email></address>
3364    </author>
3365    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3366      <organization>One Laptop per Child</organization>
3367      <address><email>jg@laptop.org</email></address>
3368    </author>
3369    <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
3370      <organization abbrev="HP">Hewlett-Packard Company</organization>
3371      <address><email>JeffMogul@acm.org</email></address>
3372    </author>
3373    <author initials="H." surname="Frystyk" fullname="Henrik Frystyk Nielsen">
3374      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3375      <address><email>henrikn@microsoft.com</email></address>
3376    </author>
3377    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3378      <organization abbrev="Adobe Systems">Adobe Systems, Incorporated</organization>
3379      <address><email>LMM@acm.org</email></address>
3380    </author>
3381    <author initials="P." surname="Leach" fullname="Paul J. Leach">
3382      <organization abbrev="Microsoft">Microsoft Corporation</organization>
3383      <address><email>paulle@microsoft.com</email></address>
3384    </author>
3385    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3386      <organization abbrev="W3C/MIT">World Wide Web Consortium</organization>
3387      <address><email>timbl@w3.org</email></address>
3388    </author>
3389    <author initials="Y." surname="Lafon" fullname="Yves Lafon" role="editor">
3390      <organization abbrev="W3C">World Wide Web Consortium</organization>
3391      <address><email>ylafon@w3.org</email></address>
3392    </author>
3393    <author initials="J. F." surname="Reschke" fullname="Julian F. Reschke" role="editor">
3394      <organization abbrev="greenbytes">greenbytes GmbH</organization>
3395      <address><email>julian.reschke@greenbytes.de</email></address>
3396    </author>
3397    <date month="&ID-MONTH;" year="&ID-YEAR;"/>
3398  </front>
3399  <seriesInfo name="Internet-Draft" value="draft-ietf-httpbis-p6-cache-&ID-VERSION;"/>
3400  <x:source href="p6-cache.xml" basename="p6-cache"/>
3401</reference>
3402
3403<reference anchor="RFC822ABNF">
3404  <front>
3405    <title abbrev="Standard for ARPA Internet Text Messages">Standard for the format of ARPA Internet text messages</title>
3406    <author initials="D.H." surname="Crocker" fullname="David H. Crocker">
3407      <organization>University of Delaware, Dept. of Electrical Engineering</organization>
3408      <address><email>DCrocker@UDel-Relay</email></address>
3409    </author>
3410    <date month="August" day="13" year="1982"/>
3411  </front>
3412  <seriesInfo name="STD" value="11"/>
3413  <seriesInfo name="RFC" value="822"/>
3414</reference>
3415
3416<reference anchor="RFC2045">
3417  <front>
3418    <title abbrev="Internet Message Bodies">Multipurpose Internet Mail Extensions (MIME) Part One: Format of Internet Message Bodies</title>
3419    <author initials="N." surname="Freed" fullname="Ned Freed">
3420      <organization>Innosoft International, Inc.</organization>
3421      <address><email>ned@innosoft.com</email></address>
3422    </author>
3423    <author initials="N.S." surname="Borenstein" fullname="Nathaniel S. Borenstein">
3424      <organization>First Virtual Holdings</organization>
3425      <address><email>nsb@nsb.fv.com</email></address>
3426    </author>
3427    <date month="November" year="1996"/>
3428  </front>
3429  <seriesInfo name="RFC" value="2045"/>
3430</reference>
3431
3432<reference anchor="RFC2047">
3433  <front>
3434    <title abbrev="Message Header Extensions">MIME (Multipurpose Internet Mail Extensions) Part Three: Message Header Extensions for Non-ASCII Text</title>
3435    <author initials="K." surname="Moore" fullname="Keith Moore">
3436      <organization>University of Tennessee</organization>
3437      <address><email>moore@cs.utk.edu</email></address>
3438    </author>
3439    <date month="November" year="1996"/>
3440  </front>
3441  <seriesInfo name="RFC" value="2047"/>
3442</reference>
3443
3444<reference anchor="RFC2119">
3445  <front>
3446    <title>Key words for use in RFCs to Indicate Requirement Levels</title>
3447    <author initials="S." surname="Bradner" fullname="Scott Bradner">
3448      <organization>Harvard University</organization>
3449      <address><email>sob@harvard.edu</email></address>
3450    </author>
3451    <date month="March" year="1997"/>
3452  </front>
3453  <seriesInfo name="BCP" value="14"/>
3454  <seriesInfo name="RFC" value="2119"/>
3455</reference>
3456
3457<reference anchor="RFC2396">
3458  <front>
3459    <title abbrev="URI Generic Syntax">Uniform Resource Identifiers (URI): Generic Syntax</title>
3460    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3461      <organization abbrev="MIT/LCS">World Wide Web Consortium</organization>
3462      <address><email>timbl@w3.org</email></address>
3463    </author>
3464    <author initials="R.T." surname="Fielding" fullname="Roy T. Fielding">
3465      <organization abbrev="U.C. Irvine">Department of Information and Computer Science</organization>
3466      <address><email>fielding@ics.uci.edu</email></address>
3467    </author>
3468    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3469      <organization abbrev="Xerox Corporation">Xerox PARC</organization>
3470      <address><email>masinter@parc.xerox.com</email></address>
3471    </author>
3472    <date month="August" year="1998"/>
3473  </front>
3474  <seriesInfo name="RFC" value="2396"/>
3475</reference>
3476
3477<reference anchor="USASCII">
3478  <front>
3479    <title>Coded Character Set -- 7-bit American Standard Code for Information Interchange</title>
3480    <author>
3481      <organization>American National Standards Institute</organization>
3482    </author>
3483    <date year="1986"/>
3484  </front>
3485  <seriesInfo name="ANSI" value="X3.4"/>
3486</reference>
3487
3488</references>
3489
3490<references title="Informative References">
3491
3492<reference anchor="Nie1997" target="http://doi.acm.org/10.1145/263105.263157">
3493  <front>
3494    <title>Network Performance Effects of HTTP/1.1, CSS1, and PNG</title>
3495    <author initials="H.F.." surname="Nielsen" fullname="H.F. Nielsen">
3496      <organization/>
3497    </author>
3498    <author initials="J." surname="Gettys" fullname="J. Gettys">
3499      <organization/>
3500    </author>
3501    <author initials="E." surname="Prud'hommeaux" fullname="E. Prud'hommeaux">
3502      <organization/>
3503    </author>
3504    <author initials="H." surname="Lie" fullname="H. Lie">
3505      <organization/>
3506    </author>
3507    <author initials="C." surname="Lilley" fullname="C. Lilley">
3508      <organization/>
3509    </author>
3510    <date year="1997" month="September"/>
3511  </front>
3512  <seriesInfo name="ACM" value="Proceedings of the ACM SIGCOMM '97 conference on Applications, technologies, architectures, and protocols for computer communication SIGCOMM '97"/>
3513</reference>
3514
3515<reference anchor="Pad1995">
3516  <front>
3517    <title>Improving HTTP Latency</title>
3518    <author initials="V.N." surname="Padmanabhan" fullname="Venkata N. Padmanabhan">
3519      <organization/>
3520    </author>
3521    <author initials="J.C." surname="Mogul" fullname="Jeffrey C. Mogul">
3522      <organization/>
3523    </author>
3524    <date year="1995" month="December"/>
3525  </front>
3526  <seriesInfo name="Computer Networks and ISDN Systems" value="v. 28, pp. 25-35"/>
3527  <annotation>
3528    Slightly revised version of paper in Proc. 2nd International WWW Conference '94: Mosaic and the Web, Oct. 1994,
3529    which is available at <eref target="http://www.ncsa.uiuc.edu/SDG/IT94/Proceedings/DDay/mogul/HTTPLatency.html"/>.
3530  </annotation>
3531</reference>
3532
3533<reference anchor="RFC822">
3534  <front>
3535    <title abbrev="Standard for ARPA Internet Text Messages">Standard for the format of ARPA Internet text messages</title>
3536    <author initials="D.H." surname="Crocker" fullname="David H. Crocker">
3537      <organization>University of Delaware, Dept. of Electrical Engineering</organization>
3538      <address><email>DCrocker@UDel-Relay</email></address>
3539    </author>
3540    <date month="August" day="13" year="1982"/>
3541  </front>
3542  <seriesInfo name="STD" value="11"/>
3543  <seriesInfo name="RFC" value="822"/>
3544</reference>
3545
3546<reference anchor="RFC959">
3547  <front>
3548    <title abbrev="File Transfer Protocol">File Transfer Protocol</title>
3549    <author initials="J." surname="Postel" fullname="J. Postel">
3550      <organization>Information Sciences Institute (ISI)</organization>
3551    </author>
3552    <author initials="J." surname="Reynolds" fullname="J. Reynolds">
3553      <organization/>
3554    </author>
3555    <date month="October" year="1985"/>
3556  </front>
3557  <seriesInfo name="STD" value="9"/>
3558  <seriesInfo name="RFC" value="959"/>
3559</reference>
3560
3561<reference anchor="RFC1123">
3562  <front>
3563    <title>Requirements for Internet Hosts - Application and Support</title>
3564    <author initials="R." surname="Braden" fullname="Robert Braden">
3565      <organization>University of Southern California (USC), Information Sciences Institute</organization>
3566      <address><email>Braden@ISI.EDU</email></address>
3567    </author>
3568    <date month="October" year="1989"/>
3569  </front>
3570  <seriesInfo name="STD" value="3"/>
3571  <seriesInfo name="RFC" value="1123"/>
3572</reference>
3573
3574<reference anchor="RFC1305">
3575  <front>
3576    <title>Network Time Protocol (Version 3) Specification, Implementation</title>
3577    <author initials="D." surname="Mills" fullname="David L. Mills">
3578      <organization>University of Delaware, Electrical Engineering Department</organization>
3579      <address><email>mills@udel.edu</email></address>
3580    </author>
3581    <date month="March" year="1992"/>
3582  </front>
3583  <seriesInfo name="RFC" value="1305"/>
3584</reference>
3585
3586<reference anchor="RFC1436">
3587  <front>
3588    <title abbrev="Gopher">The Internet Gopher Protocol (a distributed document search and retrieval protocol)</title>
3589    <author initials="F." surname="Anklesaria" fullname="Farhad Anklesaria">
3590      <organization>University of Minnesota, Computer and Information Services</organization>
3591      <address><email>fxa@boombox.micro.umn.edu</email></address>
3592    </author>
3593    <author initials="M." surname="McCahill" fullname="Mark McCahill">
3594      <organization>University of Minnesota, Computer and Information Services</organization>
3595      <address><email>mpm@boombox.micro.umn.edu</email></address>
3596    </author>
3597    <author initials="P." surname="Lindner" fullname="Paul Lindner">
3598      <organization>University of Minnesota, Computer and Information Services</organization>
3599      <address><email>lindner@boombox.micro.umn.edu</email></address>
3600    </author>
3601    <author initials="D." surname="Johnson" fullname="David Johnson">
3602      <organization>University of Minnesota, Computer and Information Services</organization>
3603      <address><email>dmj@boombox.micro.umn.edu</email></address>
3604    </author>
3605    <author initials="D." surname="Torrey" fullname="Daniel Torrey">
3606      <organization>University of Minnesota, Computer and Information Services</organization>
3607      <address><email>daniel@boombox.micro.umn.edu</email></address>
3608    </author>
3609    <author initials="B." surname="Alberti" fullname="Bob Alberti">
3610      <organization>University of Minnesota, Computer and Information Services</organization>
3611      <address><email>alberti@boombox.micro.umn.edu</email></address>
3612    </author>
3613    <date month="March" year="1993"/>
3614  </front>
3615  <seriesInfo name="RFC" value="1436"/>
3616</reference>
3617
3618<reference anchor="RFC1630">
3619  <front>
3620    <title abbrev="URIs in WWW">Universal Resource Identifiers in WWW: A Unifying Syntax for the Expression of Names and Addresses of Objects on the Network as used in the World-Wide Web</title>
3621    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3622      <organization>CERN, World-Wide Web project</organization>
3623      <address><email>timbl@info.cern.ch</email></address>
3624    </author>
3625    <date month="June" year="1994"/>
3626  </front>
3627  <seriesInfo name="RFC" value="1630"/>
3628</reference>
3629
3630<reference anchor="RFC1737">
3631  <front>
3632    <title abbrev="Requirements for Uniform Resource Names">Functional Requirements for Uniform Resource Names</title>
3633    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3634      <organization>Xerox Palo Alto Research Center</organization>
3635      <address><email>masinter@parc.xerox.com</email></address>
3636    </author>
3637    <author initials="K." surname="Sollins" fullname="Karen Sollins">
3638      <organization>MIT Laboratory for Computer Science</organization>
3639      <address><email>sollins@lcs.mit.edu</email></address>
3640    </author>
3641    <date month="December" year="1994"/>
3642  </front>
3643  <seriesInfo name="RFC" value="1737"/>
3644</reference>
3645
3646<reference anchor="RFC1738">
3647  <front>
3648    <title>Uniform Resource Locators (URL)</title>
3649    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3650      <organization>CERN, World-Wide Web project</organization>
3651      <address><email>timbl@info.cern.ch</email></address>
3652    </author>
3653    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3654      <organization>Xerox PARC</organization>
3655      <address><email>masinter@parc.xerox.com</email></address>
3656    </author>
3657    <author initials="M." surname="McCahill" fullname="Mark McCahill">
3658      <organization>University of Minnesota, Computer and Information Services</organization>
3659      <address><email>mpm@boombox.micro.umn.edu</email></address>
3660    </author>
3661    <date month="December" year="1994"/>
3662  </front>
3663  <seriesInfo name="RFC" value="1738"/>
3664</reference>
3665
3666<reference anchor="RFC1808">
3667  <front>
3668    <title>Relative Uniform Resource Locators</title>
3669    <author initials="R." surname="Fielding" fullname="Roy T. Fielding">
3670      <organization>University of California Irvine, Department of Information and Computer Science</organization>
3671      <address><email>fielding@ics.uci.edu</email></address>
3672    </author>
3673    <date month="June" year="1995"/>
3674  </front>
3675  <seriesInfo name="RFC" value="1808"/>
3676</reference>
3677
3678<reference anchor="RFC1900">
3679  <front>
3680    <title>Renumbering Needs Work</title>
3681    <author initials="B." surname="Carpenter" fullname="Brian E. Carpenter">
3682      <organization>CERN, Computing and Networks Division</organization>
3683      <address><email>brian@dxcoms.cern.ch</email></address>
3684    </author>
3685    <author initials="Y." surname="Rekhter" fullname="Yakov Rekhter">
3686      <organization>cisco Systems</organization>
3687      <address><email>yakov@cisco.com</email></address>
3688    </author>
3689    <date month="February" year="1996"/>
3690  </front>
3691  <seriesInfo name="RFC" value="1900"/>
3692</reference>
3693
3694<reference anchor="RFC1945">
3695  <front>
3696    <title abbrev="HTTP/1.0">Hypertext Transfer Protocol -- HTTP/1.0</title>
3697    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3698      <organization>MIT, Laboratory for Computer Science</organization>
3699      <address><email>timbl@w3.org</email></address>
3700    </author>
3701    <author initials="R.T." surname="Fielding" fullname="Roy T. Fielding">
3702      <organization>University of California, Irvine, Department of Information and Computer Science</organization>
3703      <address><email>fielding@ics.uci.edu</email></address>
3704    </author>
3705    <author initials="H.F." surname="Nielsen" fullname="Henrik Frystyk Nielsen">
3706      <organization>W3 Consortium, MIT Laboratory for Computer Science</organization>
3707      <address><email>frystyk@w3.org</email></address>
3708    </author>
3709    <date month="May" year="1996"/>
3710  </front>
3711  <seriesInfo name="RFC" value="1945"/>
3712</reference>
3713
3714<reference anchor="RFC2068">
3715  <front>
3716    <title abbrev="HTTP/1.1">Hypertext Transfer Protocol -- HTTP/1.1</title>
3717    <author initials="R." surname="Fielding" fullname="Roy T. Fielding">
3718      <organization>University of California, Irvine, Department of Information and Computer Science</organization>
3719      <address><email>fielding@ics.uci.edu</email></address>
3720    </author>
3721    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3722      <organization>MIT Laboratory for Computer Science</organization>
3723      <address><email>jg@w3.org</email></address>
3724    </author>
3725    <author initials="J." surname="Mogul" fullname="Jeffrey C. Mogul">
3726      <organization>Digital Equipment Corporation, Western Research Laboratory</organization>
3727      <address><email>mogul@wrl.dec.com</email></address>
3728    </author>
3729    <author initials="H." surname="Nielsen" fullname="Henrik Frystyk Nielsen">
3730      <organization>MIT Laboratory for Computer Science</organization>
3731      <address><email>frystyk@w3.org</email></address>
3732    </author>
3733    <author initials="T." surname="Berners-Lee" fullname="Tim Berners-Lee">
3734      <organization>MIT Laboratory for Computer Science</organization>
3735      <address><email>timbl@w3.org</email></address>
3736    </author>
3737    <date month="January" year="1997"/>
3738  </front>
3739  <seriesInfo name="RFC" value="2068"/>
3740</reference>
3741
3742<reference anchor="RFC2145">
3743  <front>
3744    <title abbrev="HTTP Version Numbers">Use and Interpretation of HTTP Version Numbers</title>
3745    <author initials="J.C." surname="Mogul" fullname="Jeffrey C. Mogul">
3746      <organization>Western Research Laboratory</organization>
3747      <address><email>mogul@wrl.dec.com</email></address>
3748    </author>
3749    <author initials="R.T." surname="Fielding" fullname="Roy T. Fielding">
3750      <organization>Department of Information and Computer Science</organization>
3751      <address><email>fielding@ics.uci.edu</email></address>
3752    </author>
3753    <author initials="J." surname="Gettys" fullname="Jim Gettys">
3754      <organization>MIT Laboratory for Computer Science</organization>
3755      <address><email>jg@w3.org</email></address>
3756    </author>
3757    <author initials="H.F." surname="Nielsen" fullname="Henrik Frystyk Nielsen">
3758      <organization>W3 Consortium</organization>
3759      <address><email>frystyk@w3.org</email></address>
3760    </author>
3761    <date month="May" year="1997"/>
3762  </front>
3763  <seriesInfo name="RFC" value="2145"/>
3764</reference>
3765
3766<reference anchor="RFC2324">
3767  <front>
3768    <title abbrev="HTCPCP/1.0">Hyper Text Coffee Pot Control Protocol (HTCPCP/1.0)</title>
3769    <author initials="L." surname="Masinter" fullname="Larry Masinter">
3770      <organization>Xerox Palo Alto Research Center</organization>
3771      <address><email>masinter@parc.xerox.com</email></address>
3772    </author>
3773    <date month="April" day="1" year="1998"/>
3774  </front>
3775  <seriesInfo name="RFC" value="2324"/>
3776</reference>
3777
3778<reference anchor="RFC2616">
3779  <front>
3780    <title>Hypertext Transfer Protocol -- HTTP/1.1</title>
3781    <author initials="R." surname="Fielding" fullname="R. Fielding">
3782      <organization>University of California, Irvine</organization>
3783      <address><email>fielding@ics.uci.edu</email></address>
3784    </author>
3785    <author initials="J." surname="Gettys" fullname="J. Gettys">
3786      <organization>W3C</organization>
3787      <address><email>jg@w3.org</email></address>
3788    </author>
3789    <author initials="J." surname="Mogul" fullname="J. Mogul">
3790      <organization>Compaq Computer Corporation</organization>
3791      <address><email>mogul@wrl.dec.com</email></address>
3792    </author>
3793    <author initials="H." surname="Frystyk" fullname="H. Frystyk">
3794      <organization>MIT Laboratory for Computer Science</organization>
3795      <address><email>frystyk@w3.org</email></address>
3796    </author>
3797    <author initials="L." surname="Masinter" fullname="L. Masinter">
3798      <organization>Xerox Corporation</organization>
3799      <address><email>masinter@parc.xerox.com</email></address>
3800    </author>
3801    <author initials="P." surname="Leach" fullname="P. Leach">
3802      <organization>Microsoft Corporation</organization>
3803      <address><email>paulle@microsoft.com</email></address>
3804    </author>
3805    <author initials="T." surname="Berners-Lee" fullname="T. Berners-Lee">
3806      <organization>W3C</organization>
3807      <address><email>timbl@w3.org</email></address>
3808    </author>
3809    <date month="June" year="1999"/>
3810  </front>
3811  <seriesInfo name="RFC" value="2616"/>
3812</reference>
3813
3814<reference anchor="RFC2821">
3815  <front>
3816    <title>Simple Mail Transfer Protocol</title>
3817    <author initials="J." surname="Klensin" fullname="J. Klensin">
3818      <organization>AT&amp;T Laboratories</organization>
3819      <address><email>klensin@research.att.com</email></address>
3820    </author>
3821    <date year="2001" month="April"/>
3822  </front>
3823  <seriesInfo name="RFC" value="2821"/>
3824</reference>
3825
3826<reference anchor="RFC2822">
3827  <front>
3828    <title>Internet Message Format</title>
3829    <author initials="P." surname="Resnick" fullname="P. Resnick">
3830      <organization>QUALCOMM Incorporated</organization>
3831    </author>
3832    <date year="2001" month="April"/>
3833  </front> 
3834  <seriesInfo name="RFC" value="2822"/>
3835</reference>
3836
3837<reference anchor='RFC3864'>
3838  <front>
3839    <title>Registration Procedures for Message Header Fields</title>
3840    <author initials='G.' surname='Klyne' fullname='G. Klyne'>
3841      <organization>Nine by Nine</organization>
3842      <address><email>GK-IETF@ninebynine.org</email></address>
3843    </author>
3844    <author initials='M.' surname='Nottingham' fullname='M. Nottingham'>
3845      <organization>BEA Systems</organization>
3846      <address><email>mnot@pobox.com</email></address>
3847    </author>
3848    <author initials='J.' surname='Mogul' fullname='J. Mogul'>
3849      <organization>HP Labs</organization>
3850      <address><email>JeffMogul@acm.org</email></address>
3851    </author>
3852    <date year='2004' month='September' />
3853  </front>
3854  <seriesInfo name='BCP' value='90' />
3855  <seriesInfo name='RFC' value='3864' />
3856</reference>
3857
3858<reference anchor='RFC3977'>
3859  <front>
3860    <title>Network News Transfer Protocol (NNTP)</title>
3861    <author initials='C.' surname='Feather' fullname='C. Feather'>
3862      <organization>THUS plc</organization>
3863      <address><email>clive@demon.net</email></address>
3864    </author>
3865    <date year='2006' month='October' />
3866  </front>
3867  <seriesInfo name="RFC" value="3977"/>
3868</reference>
3869
3870<reference anchor="RFC4288">
3871  <front>
3872    <title>Media Type Specifications and Registration Procedures</title>
3873    <author initials="N." surname="Freed" fullname="N. Freed">
3874      <organization>Sun Microsystems</organization>
3875      <address>
3876        <email>ned.freed@mrochek.com</email>
3877      </address>
3878    </author>
3879    <author initials="J." surname="Klensin" fullname="J. Klensin">
3880      <organization/>
3881      <address>
3882        <email>klensin+ietf@jck.com</email>
3883      </address>
3884    </author>
3885    <date year="2005" month="December"/>
3886  </front>
3887  <seriesInfo name="BCP" value="13"/>
3888  <seriesInfo name="RFC" value="4288"/>
3889</reference>
3890
3891<reference anchor="Spe" target="http://sunsite.unc.edu/mdma-release/http-prob.html">
3892  <front>
3893  <title>Analysis of HTTP Performance Problems</title>
3894  <author initials="S." surname="Spero" fullname="Simon E. Spero">
3895    <organization/>
3896  </author>
3897  <date/>
3898  </front>
3899</reference>
3900
3901<reference anchor="Tou1998" target="http://www.isi.edu/touch/pubs/http-perf96/">
3902  <front>
3903  <title>Analysis of HTTP Performance</title>
3904  <author initials="J." surname="Touch" fullname="Joe Touch">
3905    <organization>USC/Information Sciences Institute</organization>
3906    <address><email>touch@isi.edu</email></address>
3907  </author>
3908  <author initials="J." surname="Heidemann" fullname="John Heidemann">
3909    <organization>USC/Information Sciences Institute</organization>
3910    <address><email>johnh@isi.edu</email></address>
3911  </author>
3912  <author initials="K." surname="Obraczka" fullname="Katia Obraczka">
3913    <organization>USC/Information Sciences Institute</organization>
3914    <address><email>katia@isi.edu</email></address>
3915  </author>
3916  <date year="1998" month="Aug"/>
3917  </front>
3918  <seriesInfo name="ISI Research Report" value="ISI/RR-98-463"/>
3919  <annotation>(original report dated Aug. 1996)</annotation>
3920</reference>
3921
3922<reference anchor="WAIS">
3923  <front>
3924    <title>WAIS Interface Protocol Prototype Functional Specification (v1.5)</title>
3925    <author initials="F." surname="Davis" fullname="F. Davis">
3926      <organization>Thinking Machines Corporation</organization>
3927    </author>
3928    <author initials="B." surname="Kahle" fullname="B. Kahle">
3929      <organization>Thinking Machines Corporation</organization>
3930    </author>
3931    <author initials="H." surname="Morris" fullname="H. Morris">
3932      <organization>Thinking Machines Corporation</organization>
3933    </author>
3934    <author initials="J." surname="Salem" fullname="J. Salem">
3935      <organization>Thinking Machines Corporation</organization>
3936    </author>
3937    <author initials="T." surname="Shen" fullname="T. Shen">
3938      <organization>Thinking Machines Corporation</organization>
3939    </author>
3940    <author initials="R." surname="Wang" fullname="R. Wang">
3941      <organization>Thinking Machines Corporation</organization>
3942    </author>
3943    <author initials="J." surname="Sui" fullname="J. Sui">
3944      <organization>Thinking Machines Corporation</organization>
3945    </author>
3946    <author initials="M." surname="Grinbaum" fullname="M. Grinbaum">
3947      <organization>Thinking Machines Corporation</organization>
3948    </author>
3949    <date month="April" year="1990"/>
3950  </front>
3951  <seriesInfo name="Thinking Machines Corporation" value=""/>
3952</reference>
3953
3954</references>
3955
3956
3957<section title="Internet Media Types" anchor="internet.media.type.http">
3958<t>
3959   In addition to defining HTTP/1.1, this document serves
3960   as the specification for the Internet media type "message/http" and
3961   "application/http". The following is to be registered with IANA <xref target="RFC4288"/>.
3962</t>
3963<section title="Internet Media Type message/http" anchor="internet.media.type.message.http">
3964<iref item="Media Type" subitem="message/http" primary="true"/>
3965<iref item="message/http Media Type" primary="true"/>
3966<t>
3967   The message/http type can be used to enclose a single HTTP request or
3968   response message, provided that it obeys the MIME restrictions for all
3969   "message" types regarding line length and encodings.
3970</t>
3971<t>
3972  <list style="hanging" x:indent="12em">
3973    <t hangText="Type name:">
3974      message
3975    </t>
3976    <t hangText="Subtype name:">
3977      http
3978    </t>
3979    <t hangText="Required parameters:">
3980      none
3981    </t>
3982    <t hangText="Optional parameters:">
3983      version, msgtype
3984      <list style="hanging">
3985        <t hangText="version:">
3986          The HTTP-Version number of the enclosed message
3987          (e.g., "1.1"). If not present, the version can be
3988          determined from the first line of the body.
3989        </t>
3990        <t hangText="msgtype:">
3991          The message type -- "request" or "response". If not
3992          present, the type can be determined from the first
3993          line of the body.
3994        </t>
3995      </list>
3996    </t>
3997    <t hangText="Encoding considerations:">
3998      only "7bit", "8bit", or "binary" are permitted
3999    </t>
4000    <t hangText="Security considerations:">
4001      none
4002    </t>
4003    <t hangText="Interoperability considerations:">
4004      none
4005    </t>
4006    <t hangText="Published specification:">
4007      This specification (see <xref target="internet.media.type.message.http"/>).
4008    </t>
4009    <t hangText="Applications that use this media type:">
4010    </t>
4011    <t hangText="Additional information:">
4012      <list style="hanging">
4013        <t hangText="Magic number(s):">none</t>
4014        <t hangText="File extension(s):">none</t>
4015        <t hangText="Macintosh file type code(s):">none</t>
4016      </list>
4017    </t>
4018    <t hangText="Person and email address to contact for further information:">
4019      See Authors Section.
4020    </t>
4021                <t hangText="Intended usage:">
4022                  COMMON
4023    </t>
4024                <t hangText="Restrictions on usage:">
4025                  none
4026    </t>
4027    <t hangText="Author/Change controller:">
4028      IESG
4029    </t>
4030  </list>
4031</t>
4032</section>
4033<section title="Internet Media Type application/http" anchor="internet.media.type.application.http">
4034<iref item="Media Type" subitem="application/http" primary="true"/>
4035<iref item="application/http Media Type" primary="true"/>
4036<t>
4037   The application/http type can be used to enclose a pipeline of one or more
4038   HTTP request or response messages (not intermixed).
4039</t>
4040<t>
4041  <list style="hanging" x:indent="12em">
4042    <t hangText="Type name:">
4043      application
4044    </t>
4045    <t hangText="Subtype name:">
4046      http
4047    </t>
4048    <t hangText="Required parameters:">
4049      none
4050    </t>
4051    <t hangText="Optional parameters:">
4052      version, msgtype
4053      <list style="hanging">
4054        <t hangText="version:">
4055          The HTTP-Version number of the enclosed messages
4056          (e.g., "1.1"). If not present, the version can be
4057          determined from the first line of the body.
4058        </t>
4059        <t hangText="msgtype:">
4060          The message type -- "request" or "response". If not
4061          present, the type can be determined from the first
4062          line of the body.
4063        </t>
4064      </list>
4065    </t>
4066    <t hangText="Encoding considerations:">
4067      HTTP messages enclosed by this type
4068      are in "binary" format; use of an appropriate
4069      Content-Transfer-Encoding is required when
4070      transmitted via E-mail.
4071    </t>
4072    <t hangText="Security considerations:">
4073      none
4074    </t>
4075    <t hangText="Interoperability considerations:">
4076      none
4077    </t>
4078    <t hangText="Published specification:">
4079      This specification (see <xref target="internet.media.type.application.http"/>).
4080    </t>
4081    <t hangText="Applications that use this media type:">
4082    </t>
4083    <t hangText="Additional information:">
4084      <list style="hanging">
4085        <t hangText="Magic number(s):">none</t>
4086        <t hangText="File extension(s):">none</t>
4087        <t hangText="Macintosh file type code(s):">none</t>
4088      </list>
4089    </t>
4090    <t hangText="Person and email address to contact for further information:">
4091      See Authors Section.
4092    </t>
4093                <t hangText="Intended usage:">
4094                  COMMON
4095    </t>
4096                <t hangText="Restrictions on usage:">
4097                  none
4098    </t>
4099    <t hangText="Author/Change controller:">
4100      IESG
4101    </t>
4102  </list>
4103</t>
4104</section>
4105</section>
4106
4107<section title="Tolerant Applications" anchor="tolerant.applications">
4108<t>
4109   Although this document specifies the requirements for the generation
4110   of HTTP/1.1 messages, not all applications will be correct in their
4111   implementation. We therefore recommend that operational applications
4112   be tolerant of deviations whenever those deviations can be
4113   interpreted unambiguously.
4114</t>
4115<t>
4116   Clients &SHOULD; be tolerant in parsing the Status-Line and servers
4117   tolerant when parsing the Request-Line. In particular, they &SHOULD;
4118   accept any amount of SP or HTAB characters between fields, even though
4119   only a single SP is required.
4120</t>
4121<t>
4122   The line terminator for message-header fields is the sequence CRLF.
4123   However, we recommend that applications, when parsing such headers,
4124   recognize a single LF as a line terminator and ignore the leading CR.
4125</t>
4126<t>
4127   The character set of an entity-body &SHOULD; be labeled as the lowest
4128   common denominator of the character codes used within that body, with
4129   the exception that not labeling the entity is preferred over labeling
4130   the entity with the labels US-ASCII or ISO-8859-1. See &payload;.
4131</t>
4132<t>
4133   Additional rules for requirements on parsing and encoding of dates
4134   and other potential problems with date encodings include:
4135</t>
4136<t>
4137  <list style="symbols">
4138     <t>HTTP/1.1 clients and caches &SHOULD; assume that an RFC-850 date
4139        which appears to be more than 50 years in the future is in fact
4140        in the past (this helps solve the "year 2000" problem).</t>
4141
4142     <t>An HTTP/1.1 implementation &MAY; internally represent a parsed
4143        Expires date as earlier than the proper value, but &MUST-NOT;
4144        internally represent a parsed Expires date as later than the
4145        proper value.</t>
4146
4147     <t>All expiration-related calculations &MUST; be done in GMT. The
4148        local time zone &MUST-NOT; influence the calculation or comparison
4149        of an age or expiration time.</t>
4150
4151     <t>If an HTTP header incorrectly carries a date value with a time
4152        zone other than GMT, it &MUST; be converted into GMT using the
4153        most conservative possible conversion.</t>
4154  </list>
4155</t>
4156</section>
4157
4158<section title="Conversion of Date Formats" anchor="conversion.of.date.formats">
4159<t>
4160   HTTP/1.1 uses a restricted set of date formats (<xref target="full.date"/>) to
4161   simplify the process of date comparison. Proxies and gateways from
4162   other protocols &SHOULD; ensure that any Date header field present in a
4163   message conforms to one of the HTTP/1.1 formats and rewrite the date
4164   if necessary.
4165</t>
4166</section>
4167
4168<section title="Compatibility with Previous Versions" anchor="compatibility">
4169<t>
4170   It is beyond the scope of a protocol specification to mandate
4171   compliance with previous versions. HTTP/1.1 was deliberately
4172   designed, however, to make supporting previous versions easy. It is
4173   worth noting that, at the time of composing this specification
4174   (1996), we would expect commercial HTTP/1.1 servers to:
4175  <list style="symbols">
4176     <t>recognize the format of the Request-Line for HTTP/0.9, 1.0, and
4177        1.1 requests;</t>
4178
4179     <t>understand any valid request in the format of HTTP/0.9, 1.0, or
4180        1.1;</t>
4181
4182     <t>respond appropriately with a message in the same major version
4183        used by the client.</t>
4184  </list>
4185</t>
4186<t>
4187   And we would expect HTTP/1.1 clients to:
4188  <list style="symbols">
4189     <t>recognize the format of the Status-Line for HTTP/1.0 and 1.1
4190        responses;</t>
4191
4192     <t>understand any valid response in the format of HTTP/0.9, 1.0, or
4193        1.1.</t>
4194  </list>
4195</t>
4196<t>
4197   For most implementations of HTTP/1.0, each connection is established
4198   by the client prior to the request and closed by the server after
4199   sending the response. Some implementations implement the Keep-Alive
4200   version of persistent connections described in <xref x:sec="19.7.1" x:fmt="of" target="RFC2068"/>.
4201</t>
4202
4203<section title="Changes from HTTP/1.0" anchor="changes.from.1.0">
4204<t>
4205   This section summarizes major differences between versions HTTP/1.0
4206   and HTTP/1.1.
4207</t>
4208
4209<section title="Changes to Simplify Multi-homed Web Servers and Conserve IP Addresses" anchor="changes.to.simplify.multi-homed.web.servers.and.conserve.ip.addresses">
4210<t>
4211   The requirements that clients and servers support the Host request-header,
4212   report an error if the Host request-header (<xref target="header.host"/>) is
4213   missing from an HTTP/1.1 request, and accept absolute URIs (<xref target="request-uri"/>)
4214   are among the most important changes defined by this
4215   specification.
4216</t>
4217<t>
4218   Older HTTP/1.0 clients assumed a one-to-one relationship of IP
4219   addresses and servers; there was no other established mechanism for
4220   distinguishing the intended server of a request than the IP address
4221   to which that request was directed. The changes outlined above will
4222   allow the Internet, once older HTTP clients are no longer common, to
4223   support multiple Web sites from a single IP address, greatly
4224   simplifying large operational Web servers, where allocation of many
4225   IP addresses to a single host has created serious problems. The
4226   Internet will also be able to recover the IP addresses that have been
4227   allocated for the sole purpose of allowing special-purpose domain
4228   names to be used in root-level HTTP URLs. Given the rate of growth of
4229   the Web, and the number of servers already deployed, it is extremely
4230   important that all implementations of HTTP (including updates to
4231   existing HTTP/1.0 applications) correctly implement these
4232   requirements:
4233  <list style="symbols">
4234     <t>Both clients and servers &MUST; support the Host request-header.</t>
4235
4236     <t>A client that sends an HTTP/1.1 request &MUST; send a Host header.</t>
4237
4238     <t>Servers &MUST; report a 400 (Bad Request) error if an HTTP/1.1
4239        request does not include a Host request-header.</t>
4240
4241     <t>Servers &MUST; accept absolute URIs.</t>
4242  </list>
4243</t>
4244</section>
4245</section>
4246
4247<section title="Compatibility with HTTP/1.0 Persistent Connections" anchor="compatibility.with.http.1.0.persistent.connections">
4248<t>
4249   Some clients and servers might wish to be compatible with some
4250   previous implementations of persistent connections in HTTP/1.0
4251   clients and servers. Persistent connections in HTTP/1.0 are
4252   explicitly negotiated as they are not the default behavior. HTTP/1.0
4253   experimental implementations of persistent connections are faulty,
4254   and the new facilities in HTTP/1.1 are designed to rectify these
4255   problems. The problem was that some existing 1.0 clients may be
4256   sending Keep-Alive to a proxy server that doesn't understand
4257   Connection, which would then erroneously forward it to the next
4258   inbound server, which would establish the Keep-Alive connection and
4259   result in a hung HTTP/1.0 proxy waiting for the close on the
4260   response. The result is that HTTP/1.0 clients must be prevented from
4261   using Keep-Alive when talking to proxies.
4262</t>
4263<t>
4264   However, talking to proxies is the most important use of persistent
4265   connections, so that prohibition is clearly unacceptable. Therefore,
4266   we need some other mechanism for indicating a persistent connection
4267   is desired, which is safe to use even when talking to an old proxy
4268   that ignores Connection. Persistent connections are the default for
4269   HTTP/1.1 messages; we introduce a new keyword (Connection: close) for
4270   declaring non-persistence. See <xref target="header.connection"/>.
4271</t>
4272<t>
4273   The original HTTP/1.0 form of persistent connections (the Connection:
4274   Keep-Alive and Keep-Alive header) is documented in <xref target="RFC2068"/>.
4275</t>
4276</section>
4277
4278<section title="Changes from RFC 2068" anchor="changes.from.rfc.2068">
4279<t>
4280   This specification has been carefully audited to correct and
4281   disambiguate key word usage; RFC 2068 had many problems in respect to
4282   the conventions laid out in <xref target="RFC2119"/>.
4283</t>
4284<t>
4285   Transfer-coding and message lengths all interact in ways that
4286   required fixing exactly when chunked encoding is used (to allow for
4287   transfer encoding that may not be self delimiting); it was important
4288   to straighten out exactly how message lengths are computed. (Sections
4289   <xref target="transfer.codings" format="counter"/>, <xref target="message.length" format="counter"/>,
4290   <xref target="header.content-length" format="counter"/>,
4291   see also <xref target="Part3"/>, <xref target="Part5"/> and <xref target="Part6"/>)
4292</t>
4293<t>
4294   The use and interpretation of HTTP version numbers has been clarified
4295   by <xref target="RFC2145"/>. Require proxies to upgrade requests to highest protocol
4296   version they support to deal with problems discovered in HTTP/1.0
4297   implementations (<xref target="http.version"/>)
4298</t>
4299<t>
4300   Transfer-coding had significant problems, particularly with
4301   interactions with chunked encoding. The solution is that transfer-codings
4302   become as full fledged as content-codings. This involves
4303   adding an IANA registry for transfer-codings (separate from content
4304   codings), a new header field (TE) and enabling trailer headers in the
4305   future. Transfer encoding is a major performance benefit, so it was
4306   worth fixing <xref target="Nie1997"/>. TE also solves another, obscure, downward
4307   interoperability problem that could have occurred due to interactions
4308   between authentication trailers, chunked encoding and HTTP/1.0
4309   clients.(Section <xref target="transfer.codings" format="counter"/>, <xref target="chunked.transfer.encoding" format="counter"/>,
4310   and <xref target="header.te" format="counter"/>)
4311</t>
4312</section>
4313
4314<section title="Changes from RFC 2616" anchor="changes.from.rfc.2616">
4315<t>
4316  The CHAR rule does not allow the NUL character anymore (this affects
4317  the comment and quoted-string rules).  Furthermore, the quoted-pair
4318  rule does not allow escaping NUL, CR or LF anymore.
4319  (<xref target="basic.rules"/>)
4320</t>
4321<t>
4322  Clarify that HTTP-Version is case sensitive.
4323  (<xref target="http.version"/>)
4324</t>
4325<t>
4326  Remove reference to non-existant identity transfer-coding value tokens.
4327  (Sections <xref format="counter" target="transfer.codings"/> and
4328  <xref format="counter" target="message.length"/>)
4329</t>
4330<t>
4331  Clarification that the chunk length does not include
4332  the count of the octets in the chunk header and trailer.
4333  (<xref target="chunked.transfer.encoding"/>)
4334</t>
4335<t>
4336  Fix BNF to add query, as the abs_path production in
4337  <xref x:sec="3" x:fmt="of" target="RFC2396"/> doesn't define it.
4338  (<xref target="request-uri"/>)
4339</t>
4340<t>
4341  Clarify exactly when close connection options must be sent.
4342  (<xref target="header.connection"/>)
4343</t>
4344</section>
4345</section>
4346
4347<section title="Change Log (to be removed by RFC Editor before publication)" anchor="change.log">
4348
4349<section title="Since RFC2616">
4350<t>
4351  Extracted relevant partitions from <xref target="RFC2616"/>.
4352</t>
4353</section>
4354
4355<section title="Since draft-ietf-httpbis-p1-messaging-00">
4356<t>
4357  Closed issues:
4358  <list style="symbols"> 
4359    <t>
4360      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/1"/>:
4361      "HTTP Version should be case sensitive"
4362      (<eref target="http://purl.org/NET/http-errata#verscase"/>)
4363    </t>
4364    <t>
4365      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/2"/>:
4366      "'unsafe' characters"
4367      (<eref target="http://purl.org/NET/http-errata#unsafe-uri"/>)
4368    </t>
4369    <t>
4370      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/3"/>:
4371      "Chunk Size Definition"
4372      (<eref target="http://purl.org/NET/http-errata#chunk-size"/>)
4373    </t>
4374    <t>
4375      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/4"/>:
4376      "Message Length"
4377      (<eref target="http://purl.org/NET/http-errata#msg-len-chars"/>)
4378    </t>
4379    <t>
4380      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/8"/>:
4381      "Media Type Registrations"
4382      (<eref target="http://purl.org/NET/http-errata#media-reg"/>)
4383    </t>
4384    <t>
4385      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/11"/>:
4386      "URI includes query"
4387      (<eref target="http://purl.org/NET/http-errata#uriquery"/>)
4388    </t>
4389    <t>
4390      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/15"/>:
4391      "No close on 1xx responses"
4392      (<eref target="http://purl.org/NET/http-errata#noclose1xx"/>)
4393    </t>
4394    <t>
4395      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/16"/>:
4396      "Remove 'identity' token references"
4397      (<eref target="http://purl.org/NET/http-errata#identity"/>)
4398    </t>
4399    <t>
4400      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/26"/>:
4401      "Import query BNF"
4402    </t>
4403    <t>
4404      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/31"/>:
4405      "qdtext BNF"
4406    </t>
4407    <t>
4408      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/35"/>:
4409      "Normative and Informative references"
4410    </t>
4411    <t>
4412      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/42"/>:
4413      "RFC2606 Compliance"
4414    </t>
4415    <t>
4416      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/45"/>:
4417      "RFC977 reference"
4418    </t>
4419    <t>
4420      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/46"/>:
4421      "RFC1700 references"
4422    </t>
4423    <t>
4424      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/47"/>:
4425      "inconsistency in date format explanation"
4426    </t>
4427    <t>
4428      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/48"/>:
4429      "Date reference typo"
4430    </t>
4431    <t>
4432      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/65"/>:
4433      "Informative references"
4434    </t>
4435    <t>
4436      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/66"/>:
4437      "ISO-8859-1 Reference"
4438    </t>
4439    <t>
4440      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/86"/>:
4441      "Normative up-to-date references"
4442    </t>
4443  </list>
4444</t>
4445<t>
4446  Other changes:
4447  <list style="symbols"> 
4448    <t>
4449      Update media type registrations to use RFC4288 template.
4450    </t>
4451    <t>
4452      Use names of RFC4234 core rules DQUOTE and HTAB,
4453      fix broken ABNF for chunk-data
4454      (work in progress on <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/36"/>)
4455    </t>
4456  </list>
4457</t>
4458</section>
4459
4460<section title="Since draft-ietf-httpbis-p1-messaging-01">
4461<t>
4462  Closed issues:
4463  <list style="symbols"> 
4464    <t>
4465      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/19"/>:
4466      "Bodies on GET (and other) requests"
4467    </t>
4468    <t>
4469      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/55"/>:
4470      "Updating to RFC4288"
4471    </t>
4472    <t>
4473      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/57"/>:
4474      "Status Code and Reason Phrase"
4475    </t>
4476    <t>
4477      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/82"/>:
4478      "rel_path not used"
4479    </t>
4480  </list>
4481</t>
4482<t>
4483  Ongoing work on ABNF conversion (<eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/36"/>):
4484  <list style="symbols"> 
4485    <t>
4486      Get rid of duplicate BNF rule names ("host" -> "uri-host", "trailer" ->
4487      "trailer-part").
4488    </t>
4489    <t>
4490      Avoid underscore character in rule names ("http_URL" ->
4491      "http-URL", "abs_path" -> "path-absolute").
4492    </t>
4493    <t>
4494      Add rules for terms imported from URI spec ("absoluteURI", "authority",
4495      "path-absolute", "port", "query", "relativeURI", "host) -- these will
4496      have to be updated when switching over to RFC3986.
4497    </t>
4498    <t>
4499      Synchronize core rules with RFC5234 (this includes a change to CHAR
4500      which now excludes NUL).
4501    </t>
4502    <t>
4503      Get rid of prose rules that span multiple lines.
4504    </t>
4505    <t>
4506      Get rid of unused rules LOALPHA and UPALPHA.
4507    </t>
4508    <t>
4509      Move "Product Tokens" section (back) into Part 1, as "token" is used
4510      in the definition of the Upgrade header.
4511    </t>
4512    <t>
4513      Add explicit references to BNF syntax and rules imported from other parts of the specification.
4514    </t>
4515    <t>
4516      Rewrite prose rule "token" in terms of "tchar", rewrite prose rule "TEXT".
4517    </t>
4518  </list>
4519</t>
4520</section>
4521
4522<section title="Since draft-ietf-httpbis-p1-messaging-02" anchor="changes.since.02">
4523<t>
4524  Closed issues:
4525  <list style="symbols"> 
4526    <t>
4527      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/51"/>:
4528      "HTTP-date vs. rfc1123-date"
4529    </t>
4530    <t>
4531      <eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/64"/>:
4532      "WS in quoted-pair"
4533    </t>
4534  </list>
4535</t>
4536<t>
4537  Ongoing work on IANA Message Header Registration (<eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/40"/>):
4538  <list style="symbols"> 
4539    <t>
4540      Reference RFC 3984, and update header registrations for headers defined
4541      in this document.
4542    </t>
4543  </list>
4544</t>
4545<t>
4546  Ongoing work on ABNF conversion (<eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/36"/>):
4547  <list style="symbols"> 
4548    <t>
4549      Replace string literals when the string really is case-sensitive (HTTP-Version).
4550    </t>
4551  </list>
4552</t>
4553</section>
4554
4555<section title="Since draft-ietf-httpbis-p1-messaging-03" anchor="changes.since.03">
4556<t>
4557  Ongoing work on ABNF conversion (<eref target="http://www3.tools.ietf.org/wg/httpbis/trac/ticket/36"/>):
4558  <list style="symbols"> 
4559    <t>
4560      Replace string literals when the string really is case-sensitive (HTTP-Date).
4561    </t>
4562  </list>
4563</t>
4564</section>
4565
4566</section>
4567
4568</back>
4569</rfc>
Note: See TracBrowser for help on using the repository browser.