• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright (c) 2006-2009 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 #ifndef NET_HTTP_HTTP_RESPONSE_HEADERS_H_
6 #define NET_HTTP_HTTP_RESPONSE_HEADERS_H_
7 
8 #include <string>
9 #include <vector>
10 
11 #include "base/basictypes.h"
12 #include "base/hash_tables.h"
13 #include "base/ref_counted.h"
14 #include "net/http/http_version.h"
15 
16 class Pickle;
17 
18 namespace base {
19 class Time;
20 class TimeDelta;
21 }
22 
23 namespace net {
24 
25 // HttpResponseHeaders: parses and holds HTTP response headers.
26 class HttpResponseHeaders
27     : public base::RefCountedThreadSafe<HttpResponseHeaders> {
28  public:
29   // Parses the given raw_headers.  raw_headers should be formatted thus:
30   // includes the http status response line, each line is \0-terminated, and
31   // it's terminated by an empty line (ie, 2 \0s in a row).
32   // (Note that line continuations should have already been joined;
33   // see HttpUtil::AssembleRawHeaders)
34   //
35   // NOTE: For now, raw_headers is not really 'raw' in that this constructor is
36   // called with a 'NativeMB' string on Windows because WinHTTP does not allow
37   // us to access the raw byte sequence as sent by a web server.  In any case,
38   // HttpResponseHeaders does not perform any encoding changes on the input.
39   //
40   explicit HttpResponseHeaders(const std::string& raw_headers);
41 
42   // Initializes from the representation stored in the given pickle.  The data
43   // for this object is found relative to the given pickle_iter, which should
44   // be passed to the pickle's various Read* methods.
45   HttpResponseHeaders(const Pickle& pickle, void** pickle_iter);
46 
47   // Persist options.
48   typedef int PersistOptions;
49   static const PersistOptions PERSIST_RAW = -1;  // Raw, unparsed headers.
50   static const PersistOptions PERSIST_ALL = 0;  // Parsed headers.
51   static const PersistOptions PERSIST_SANS_COOKIES = 1 << 0;
52   static const PersistOptions PERSIST_SANS_CHALLENGES = 1 << 1;
53   static const PersistOptions PERSIST_SANS_HOP_BY_HOP = 1 << 2;
54   static const PersistOptions PERSIST_SANS_NON_CACHEABLE = 1 << 3;
55   static const PersistOptions PERSIST_SANS_RANGES = 1 << 4;
56 
57   // Appends a representation of this object to the given pickle.
58   // The options argument can be a combination of PersistOptions.
59   void Persist(Pickle* pickle, PersistOptions options);
60 
61   // Performs header merging as described in 13.5.3 of RFC 2616.
62   void Update(const HttpResponseHeaders& new_headers);
63 
64   // Removes all instances of a particular header.
65   void RemoveHeader(const std::string& name);
66 
67   // Adds a particular header.  |header| has to be a single header without any
68   // EOL termination, just [<header-name>: <header-values>]
69   // If a header with the same name is already stored, the two headers are not
70   // merged together by this method; the one provided is simply put at the
71   // end of the list.
72   void AddHeader(const std::string& header);
73 
74   // Replaces the current status line with the provided one (|new_status| should
75   // not have any EOL).
76   void ReplaceStatusLine(const std::string& new_status);
77 
78   // Creates a normalized header string.  The output will be formatted exactly
79   // like so:
80   //     HTTP/<version> <status_code> <status_text>\n
81   //     [<header-name>: <header-values>\n]*
82   // meaning, each line is \n-terminated, and there is no extra whitespace
83   // beyond the single space separators shown (of course, values can contain
84   // whitespace within them).  If a given header-name appears more than once
85   // in the set of headers, they are combined into a single line like so:
86   //     <header-name>: <header-value1>, <header-value2>, ...<header-valueN>\n
87   //
88   // DANGER: For some headers (e.g., "Set-Cookie"), the normalized form can be
89   // a lossy format.  This is due to the fact that some servers generate
90   // Set-Cookie headers that contain unquoted commas (usually as part of the
91   // value of an "expires" attribute).  So, use this function with caution.  Do
92   // not expect to be able to re-parse Set-Cookie headers from this output.
93   //
94   // NOTE: Do not make any assumptions about the encoding of this output
95   // string.  It may be non-ASCII, and the encoding used by the server is not
96   // necessarily known to us.  Do not assume that this output is UTF-8!
97   //
98   // TODO(darin): remove this method
99   //
100   void GetNormalizedHeaders(std::string* output) const;
101 
102   // Fetch the "normalized" value of a single header, where all values for the
103   // header name are separated by commas.  See the GetNormalizedHeaders for
104   // format details.  Returns false if this header wasn't found.
105   //
106   // NOTE: Do not make any assumptions about the encoding of this output
107   // string.  It may be non-ASCII, and the encoding used by the server is not
108   // necessarily known to us.  Do not assume that this output is UTF-8!
109   //
110   // TODO(darin): remove this method
111   //
112   bool GetNormalizedHeader(const std::string& name, std::string* value) const;
113 
114   // Returns the normalized status line.  For HTTP/0.9 responses (i.e.,
115   // responses that lack a status line), this is the manufactured string
116   // "HTTP/0.9 200 OK".
117   std::string GetStatusLine() const;
118 
119   // Get the HTTP version of the normalized status line.
GetHttpVersion()120   HttpVersion GetHttpVersion() const {
121     return http_version_;
122   }
123 
124   // Get the HTTP version determined while parsing; or (0,0) if parsing failed
GetParsedHttpVersion()125   HttpVersion GetParsedHttpVersion() const {
126     return parsed_http_version_;
127   }
128 
129   // Get the HTTP status text of the normalized status line.
130   std::string GetStatusText() const;
131 
132   // Enumerate the "lines" of the response headers.  This skips over the status
133   // line.  Use GetStatusLine if you are interested in that.  Note that this
134   // method returns the un-coalesced response header lines, so if a response
135   // header appears on multiple lines, then it will appear multiple times in
136   // this enumeration (in the order the header lines were received from the
137   // server).  Initialize a 'void*' variable to NULL and pass it by address to
138   // EnumerateHeaderLines.  Call EnumerateHeaderLines repeatedly until it
139   // returns false.  The out-params 'name' and 'value' are set upon success.
140   bool EnumerateHeaderLines(void** iter,
141                             std::string* name,
142                             std::string* value) const;
143 
144   // Enumerate the values of the specified header.   If you are only interested
145   // in the first header, then you can pass NULL for the 'iter' parameter.
146   // Otherwise, to iterate across all values for the specified header,
147   // initialize a 'void*' variable to NULL and pass it by address to
148   // EnumerateHeader.  Call EnumerateHeader repeatedly until it returns false.
149   bool EnumerateHeader(void** iter,
150                        const std::string& name,
151                        std::string* value) const;
152 
153   // Returns true if the response contains the specified header-value pair.
154   // Both name and value are compared case insensitively.
155   bool HasHeaderValue(const std::string& name, const std::string& value) const;
156 
157   // Get the mime type and charset values in lower case form from the headers.
158   // Empty strings are returned if the values are not present.
159   void GetMimeTypeAndCharset(std::string* mime_type,
160                              std::string* charset) const;
161 
162   // Get the mime type in lower case from the headers.  If there's no mime
163   // type, returns false.
164   bool GetMimeType(std::string* mime_type) const;
165 
166   // Get the charset in lower case from the headers.  If there's no charset,
167   // returns false.
168   bool GetCharset(std::string* charset) const;
169 
170   // Returns true if this response corresponds to a redirect.  The target
171   // location of the redirect is optionally returned if location is non-null.
172   bool IsRedirect(std::string* location) const;
173 
174   // Returns true if the HTTP response code passed in corresponds to a
175   // redirect.
176   static bool IsRedirectResponseCode(int response_code);
177 
178   // Returns true if the response cannot be reused without validation.  The
179   // result is relative to the current_time parameter, which is a parameter to
180   // support unit testing.  The request_time parameter indicates the time at
181   // which the request was made that resulted in this response, which was
182   // received at response_time.
183   bool RequiresValidation(const base::Time& request_time,
184                           const base::Time& response_time,
185                           const base::Time& current_time) const;
186 
187   // Returns the amount of time the server claims the response is fresh from
188   // the time the response was generated.  See section 13.2.4 of RFC 2616.  See
189   // RequiresValidation for a description of the response_time parameter.
190   base::TimeDelta GetFreshnessLifetime(const base::Time& response_time) const;
191 
192   // Returns the age of the response.  See section 13.2.3 of RFC 2616.
193   // See RequiresValidation for a description of this method's parameters.
194   base::TimeDelta GetCurrentAge(const base::Time& request_time,
195                                 const base::Time& response_time,
196                                 const base::Time& current_time) const;
197 
198   // The following methods extract values from the response headers.  If a
199   // value is not present, then false is returned.  Otherwise, true is returned
200   // and the out param is assigned to the corresponding value.
201   bool GetMaxAgeValue(base::TimeDelta* value) const;
202   bool GetAgeValue(base::TimeDelta* value) const;
203   bool GetDateValue(base::Time* value) const;
204   bool GetLastModifiedValue(base::Time* value) const;
205   bool GetExpiresValue(base::Time* value) const;
206 
207   // Extracts the time value of a particular header.  This method looks for the
208   // first matching header value and parses its value as a HTTP-date.
209   bool GetTimeValuedHeader(const std::string& name, base::Time* result) const;
210 
211   // Determines if this response indicates a keep-alive connection.
212   bool IsKeepAlive() const;
213 
214   // Returns true if this response has a strong etag or last-modified header.
215   // See section 13.3.3 of RFC 2616.
216   bool HasStrongValidators() const;
217 
218   // Extracts the value of the Content-Length header or returns -1 if there is
219   // no such header in the response.
220   int64 GetContentLength() const;
221 
222   // Extracts the values in a Content-Range header and returns true if they are
223   // valid for a 206 response; otherwise returns false.
224   // The following values will be outputted:
225   // |*first_byte_position| = inclusive position of the first byte of the range
226   // |*last_byte_position| = inclusive position of the last byte of the range
227   // |*instance_length| = size in bytes of the object requested
228   // If any of the above values is unknown, its value will be -1.
229   bool GetContentRange(int64* first_byte_position,
230                        int64* last_byte_position,
231                        int64* instance_length) const;
232 
233   // Returns the HTTP response code.  This is 0 if the response code text seems
234   // to exist but could not be parsed.  Otherwise, it defaults to 200 if the
235   // response code is not found in the raw headers.
response_code()236   int response_code() const { return response_code_; }
237 
238   // Returns the raw header string.
raw_headers()239   const std::string& raw_headers() const { return raw_headers_; }
240 
241  private:
242   friend class base::RefCountedThreadSafe<HttpResponseHeaders>;
243 
244   typedef base::hash_set<std::string> HeaderSet;
245 
HttpResponseHeaders()246   HttpResponseHeaders() {}
~HttpResponseHeaders()247   ~HttpResponseHeaders() {}
248 
249   // Initializes from the given raw headers.
250   void Parse(const std::string& raw_input);
251 
252   // Helper function for ParseStatusLine.
253   // Tries to extract the "HTTP/X.Y" from a status line formatted like:
254   //    HTTP/1.1 200 OK
255   // with line_begin and end pointing at the begin and end of this line.  If the
256   // status line is malformed, returns HttpVersion(0,0).
257   static HttpVersion ParseVersion(std::string::const_iterator line_begin,
258                                   std::string::const_iterator line_end);
259 
260   // Tries to extract the status line from a header block, given the first
261   // line of said header block.  If the status line is malformed, we'll
262   // construct a valid one.  Example input:
263   //    HTTP/1.1 200 OK
264   // with line_begin and end pointing at the begin and end of this line.
265   // Output will be a normalized version of this, with a trailing \n.
266   void ParseStatusLine(std::string::const_iterator line_begin,
267                        std::string::const_iterator line_end,
268                        bool has_headers);
269 
270   // Find the header in our list (case-insensitive) starting with parsed_ at
271   // index |from|.  Returns string::npos if not found.
272   size_t FindHeader(size_t from, const std::string& name) const;
273 
274   // Add a header->value pair to our list.  If we already have header in our
275   // list, append the value to it.
276   void AddHeader(std::string::const_iterator name_begin,
277                  std::string::const_iterator name_end,
278                  std::string::const_iterator value_begin,
279                  std::string::const_iterator value_end);
280 
281   // Add to parsed_ given the fields of a ParsedHeader object.
282   void AddToParsed(std::string::const_iterator name_begin,
283                    std::string::const_iterator name_end,
284                    std::string::const_iterator value_begin,
285                    std::string::const_iterator value_end);
286 
287   // Replaces the current headers with the merged version of |raw_headers| and
288   // the current headers without the headers in |headers_to_remove|. Note that
289   // |headers_to_remove| are removed from the current headers (before the
290   // merge), not after the merge.
291   void MergeWithHeaders(const std::string& raw_headers,
292                         const HeaderSet& headers_to_remove);
293 
294   // Adds the values from any 'cache-control: no-cache="foo,bar"' headers.
295   void AddNonCacheableHeaders(HeaderSet* header_names) const;
296 
297   // Adds the set of header names that contain cookie values.
298   static void AddSensitiveHeaders(HeaderSet* header_names);
299 
300   // Adds the set of rfc2616 hop-by-hop response headers.
301   static void AddHopByHopHeaders(HeaderSet* header_names);
302 
303   // Adds the set of challenge response headers.
304   static void AddChallengeHeaders(HeaderSet* header_names);
305 
306   // Adds the set of cookie response headers.
307   static void AddCookieHeaders(HeaderSet* header_names);
308 
309   // Adds the set of content range response headers.
310   static void AddHopContentRangeHeaders(HeaderSet* header_names);
311 
312   // The members of this structure point into raw_headers_.
313   struct ParsedHeader {
314     std::string::const_iterator name_begin;
315     std::string::const_iterator name_end;
316     std::string::const_iterator value_begin;
317     std::string::const_iterator value_end;
318 
319     // A header "continuation" contains only a subsequent value for the
320     // preceding header.  (Header values are comma separated.)
is_continuationParsedHeader321     bool is_continuation() const { return name_begin == name_end; }
322   };
323   typedef std::vector<ParsedHeader> HeaderList;
324 
325   // We keep a list of ParsedHeader objects.  These tell us where to locate the
326   // header-value pairs within raw_headers_.
327   HeaderList parsed_;
328 
329   // The raw_headers_ consists of the normalized status line (terminated with a
330   // null byte) and then followed by the raw null-terminated headers from the
331   // input that was passed to our constructor.  We preserve the input [*] to
332   // maintain as much ancillary fidelity as possible (since it is sometimes
333   // hard to tell what may matter down-stream to a consumer of XMLHttpRequest).
334   // [*] The status line may be modified.
335   std::string raw_headers_;
336 
337   // This is the parsed HTTP response code.
338   int response_code_;
339 
340   // The normalized http version (consistent with what GetStatusLine() returns).
341   HttpVersion http_version_;
342 
343   // The parsed http version number (not normalized).
344   HttpVersion parsed_http_version_;
345 
346   DISALLOW_COPY_AND_ASSIGN(HttpResponseHeaders);
347 };
348 
349 }  // namespace net
350 
351 #endif  // NET_HTTP_HTTP_RESPONSE_HEADERS_H_
352