blob: 0f59d653ed61db84f94016fbda27f91b7ebeb1e3 [file] [log] [blame]
// Copyright 2012 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef NET_HTTP_HTTP_RESPONSE_HEADERS_H_
#define NET_HTTP_HTTP_RESPONSE_HEADERS_H_
#include <stddef.h>
#include <stdint.h>
#include <optional>
#include <string>
#include <string_view>
#include <unordered_set>
#include <vector>
#include "base/check.h"
#include "base/functional/callback.h"
#include "base/memory/ref_counted.h"
#include "base/time/time.h"
#include "base/trace_event/base_tracing_forward.h"
#include "base/types/pass_key.h"
#include "base/values.h"
#include "net/base/net_export.h"
#include "net/http/http_util.h"
#include "net/http/http_version.h"
#include "net/log/net_log_capture_mode.h"
#include "third_party/abseil-cpp/absl/container/inlined_vector.h"
namespace base {
class Pickle;
class PickleIterator;
class Time;
class TimeDelta;
}
namespace net {
class HttpByteRange;
enum ValidationType {
VALIDATION_NONE, // The resource is fresh.
VALIDATION_ASYNCHRONOUS, // The resource requires async revalidation.
VALIDATION_SYNCHRONOUS // The resource requires sync revalidation.
};
// HttpResponseHeaders: parses and holds HTTP response headers.
class NET_EXPORT HttpResponseHeaders
: public base::RefCountedThreadSafe<HttpResponseHeaders> {
public:
// This class provides the most efficient way to build an HttpResponseHeaders
// object if the headers are all available in memory at once.
// Example usage:
// scoped_refptr<HttpResponseHeaders> headers =
// HttpResponseHeaders::Builder(HttpVersion(1, 1), 307)
// .AddHeader("Location", url.spec())
// .Build();
class NET_EXPORT Builder {
public:
// Constructs a builder with a particular `version` and `status`. `version`
// must be (1,0), (1,1) or (2,0). `status` is the response code optionally
// followed by a space and the status text, eg. "200 OK". The caller is
// required to guarantee that `status` does not contain embedded nul
// characters, and that it will remain valid until Build() is called.
Builder(HttpVersion version, std::string_view status);
Builder(const Builder&) = delete;
Builder& operator=(const Builder&) = delete;
~Builder();
// Adds a header. Returns a reference to the object so that calls can be
// chained. Duplicates will be preserved. Order will be preserved. For
// performance reasons, strings are not copied until Build() is called. It
// is the caller's responsibility to ensure the values remain valid until
// then. The caller is required to guarantee that `name` and `value` are
// valid HTTP headers and in particular that they do not contain embedded
// nul characters.
Builder& AddHeader(std::string_view name, std::string_view value) {
DCHECK(HttpUtil::IsValidHeaderName(name));
DCHECK(HttpUtil::IsValidHeaderValue(value));
headers_.push_back({name, value});
return *this;
}
scoped_refptr<HttpResponseHeaders> Build();
private:
using KeyValuePair = std::pair<std::string_view, std::string_view>;
const HttpVersion version_;
const std::string_view status_;
// 40 is enough for 94% of responses on Windows and 98% on Android.
absl::InlinedVector<KeyValuePair, 40> headers_;
};
using BuilderPassKey = base::PassKey<Builder>;
// Persist options.
typedef int PersistOptions;
static const PersistOptions PERSIST_RAW = -1; // Raw, unparsed headers.
static const PersistOptions PERSIST_ALL = 0; // Parsed headers.
static const PersistOptions PERSIST_SANS_COOKIES = 1 << 0;
static const PersistOptions PERSIST_SANS_CHALLENGES = 1 << 1;
static const PersistOptions PERSIST_SANS_HOP_BY_HOP = 1 << 2;
static const PersistOptions PERSIST_SANS_NON_CACHEABLE = 1 << 3;
static const PersistOptions PERSIST_SANS_RANGES = 1 << 4;
static const PersistOptions PERSIST_SANS_SECURITY_STATE = 1 << 5;
struct FreshnessLifetimes {
// How long the resource will be fresh for.
base::TimeDelta freshness;
// How long after becoming not fresh that the resource will be stale but
// usable (if async revalidation is enabled).
base::TimeDelta staleness;
};
static const char kContentRange[];
static const char kLastModified[];
static const char kVary[];
static constexpr std::string_view kCacheControl = "cache-control";
static constexpr std::string_view kNoStore = "no-store";
static constexpr std::string_view kNoCache = "no-cache";
static constexpr std::string_view kMustRevalidate = "must-revalidate";
static constexpr std::string_view kMaxAge = "max-age=";
static constexpr std::string_view kStaleWhileRevalidate =
"stale-while-revalidate=";
HttpResponseHeaders() = delete;
// Parses the given raw_headers. raw_headers should be formatted thus:
// includes the http status response line, each line is \0-terminated, and
// it's terminated by an empty line (ie, 2 \0s in a row).
// (Note that line continuations should have already been joined;
// see HttpUtil::AssembleRawHeaders)
//
// HttpResponseHeaders does not perform any encoding changes on the input.
//
explicit HttpResponseHeaders(std::string_view raw_headers);
// Initializes from the representation stored in the given pickle. The data
// for this object is found relative to the given pickle_iter, which should
// be passed to the pickle's various Read* methods.
explicit HttpResponseHeaders(base::PickleIterator* pickle_iter);
// Use Builder::Build() rather than calling this directly. The BuilderPassKey
// prevents accidental use from other code.
HttpResponseHeaders(
BuilderPassKey,
HttpVersion version,
std::string_view status,
base::span<const std::pair<std::string_view, std::string_view>> headers);
// Takes headers as an ASCII string and tries to parse them as HTTP response
// headers. returns nullptr on failure. Unlike the HttpResponseHeaders
// constructor that takes a std::string, HttpUtil::AssembleRawHeaders should
// not be called on |headers| before calling this method.
static scoped_refptr<HttpResponseHeaders> TryToCreate(
std::string_view headers);
// Takes content_type as an ASCII string and tries to combine it with the HTTP
// status line for data: URLs. Returns nullptr on failure. Unlike TryToCreate,
// HttpUtil::AssembleRawHeaders does not need to be called as the raw headers
// are already known.
static scoped_refptr<HttpResponseHeaders> TryToCreateForDataURL(
std::string_view content_type);
HttpResponseHeaders(const HttpResponseHeaders&) = delete;
HttpResponseHeaders& operator=(const HttpResponseHeaders&) = delete;
// Appends a representation of this object to the given pickle.
// The options argument can be a combination of PersistOptions.
void Persist(base::Pickle* pickle, PersistOptions options);
// Performs header merging as described in 13.5.3 of RFC 2616.
void Update(const HttpResponseHeaders& new_headers);
// Removes all instances of a particular header.
void RemoveHeader(std::string_view name);
// Removes all instances of particular headers.
void RemoveHeaders(const std::unordered_set<std::string>& header_names);
// Removes a particular header line. The header name is compared
// case-insensitively.
void RemoveHeaderLine(const std::string& name, const std::string& value);
// Adds the specified response header. If a header with the same name is
// already stored, the two headers are not merged together by this method; the
// one provided is simply put at the end of the list.
void AddHeader(std::string_view name, std::string_view value);
// Sets the specified response header, removing any matching old one if
// present. The new header is added to the end of the header list, rather than
// replacing the old one. This is the same as calling RemoveHeader() followed
// be SetHeader().
void SetHeader(std::string_view name, std::string_view value);
// Adds a cookie header. |cookie_string| should be the header value without
// the header name (Set-Cookie).
void AddCookie(std::string_view cookie_string);
// Replaces the current status line with the provided one (|new_status| should
// not have any EOL).
void ReplaceStatusLine(const std::string& new_status);
// Updates headers (Content-Length and Content-Range) in the |headers| to
// include the right content length and range for |byte_range|. This also
// updates HTTP status line if |replace_status_line| is true.
// |byte_range| must have a valid, bounded range (i.e. coming from a valid
// response or should be usable for a response).
void UpdateWithNewRange(const HttpByteRange& byte_range,
int64_t resource_size,
bool replace_status_line);
// Fetches the "normalized" value of a single header, where all values for the
// header name are separated by commas. This will be the sequence of strings
// that would be returned from repeated calls to EnumerateHeader, joined by
// the string ", ".
//
// Returns std::nullopt if this header wasn't found.
//
// Example:
// Foo: a, b,c
// Foo: d
//
// std::optional<std::string> value = GetNormalizedHeader("Foo");
// // Now, |value| is "a, b, c, d".
//
// NOTE: Do not make any assumptions about the encoding of this output
// string. It may be non-ASCII, and the encoding used by the server is not
// necessarily known to us. Do not assume that this output is UTF-8!
[[nodiscard]] std::optional<std::string> GetNormalizedHeader(
std::string_view name) const;
// Returns the normalized status line.
std::string GetStatusLine() const;
// Get the HTTP version of the normalized status line.
HttpVersion GetHttpVersion() const {
return http_version_;
}
// Get the HTTP status text of the normalized status line.
std::string GetStatusText() const;
// Enumerate the "lines" of the response headers. This skips over the status
// line. Use GetStatusLine if you are interested in that. Note that this
// method returns the un-coalesced response header lines, so if a response
// header appears on multiple lines, then it will appear multiple times in
// this enumeration (in the order the header lines were received from the
// server). Also, a given header might have an empty value. Initialize a
// 'size_t' variable to 0 and pass it by address to EnumerateHeaderLines.
// Call EnumerateHeaderLines repeatedly until it returns false. The
// out-params 'name' and 'value' are set upon success.
//
// WARNING: In effect, repeatedly calling EnumerateHeaderLines should return
// the same collection of (name, value) pairs that you'd obtain from passing
// each header name into EnumerateHeader and repeatedly calling
// EnumerateHeader. This means the output will *not* necessarily correspond to
// the verbatim lines of the headers. For instance, given
// Foo: a, b
// Foo: c
// EnumerateHeaderLines will output ("Foo", "a"), ("Foo", "b"), and
// ("Foo", "c").
bool EnumerateHeaderLines(size_t* iter,
std::string* name,
std::string* value) const;
// Enumerate the values of the specified header. If you are only interested
// in the first header, then you can pass nullptr for the 'iter' parameter.
// Otherwise, to iterate across all values for the specified header,
// initialize a 'size_t' variable to 0 and pass it by address to
// EnumerateHeader. Note that a header might have an empty value. Call
// EnumerateHeader repeatedly until it returns std::nullopt.
//
// The returned value remains valid for the lifetime of HttpResponseHeaders,
// or until the headers are modified, so it is legal to hold onto a returned
// string_view while continuing to enumerate other values for a header.
//
// Unless a header is explicitly marked as non-coalescing (see
// HttpUtil::IsNonCoalescingHeader), headers that contain
// comma-separated lists are treated "as if" they had been sent as
// distinct headers. That is, a header of "Foo: a, b, c" would
// enumerate into distinct values of "a", "b", and "c". This is also
// true for headers that occur multiple times in a response; unless
// they are marked non-coalescing, "Foo: a, b" followed by "Foo: c"
// will enumerate to "a", "b", "c". Commas inside quoted strings are ignored,
// for example a header of 'Foo: "a, b", "c"' would enumerate as '"a, b"',
// '"c"'.
//
// This can cause issues for headers that might have commas in fields that
// aren't quoted strings, for example a header of "Foo: <a, b>, <c>" would
// enumerate as '<a', 'b>', '<c>', rather than as '<a, b>', '<c>'.
//
// To handle cases such as this, use GetNormalizedHeader to return the full
// concatenated header, and then parse manually.
std::optional<std::string_view> EnumerateHeader(size_t* iter,
std::string_view name) const;
// Deprecated overload of EnumerateHeader. Returns a bool instead of an
// options, which is false once all headers with the provided name have been
// enumerated, and copies the header's value to `value` whenever it returns
// true.
bool EnumerateHeader(size_t* iter,
std::string_view name,
std::string* value) const;
// Returns true if the response contains the specified header-value pair.
// Both name and value are compared case insensitively.
bool HasHeaderValue(std::string_view name, std::string_view value) const;
// Returns true if the response contains the specified header.
// The name is compared case insensitively.
bool HasHeader(std::string_view name) const;
// Get the mime type and charset values in lower case form from the headers.
// Empty strings are returned if the values are not present.
void GetMimeTypeAndCharset(std::string* mime_type,
std::string* charset) const;
// Get the mime type in lower case from the headers. If there's no mime
// type, returns false.
bool GetMimeType(std::string* mime_type) const;
// Get the charset in lower case from the headers. If there's no charset,
// returns false.
bool GetCharset(std::string* charset) const;
// Returns true if this response corresponds to a redirect. The target
// location of the redirect is optionally returned if location is non-null.
bool IsRedirect(std::string* location) const;
// Returns true if this response included the `Activate-Storage-Access: retry;
// allowed-origin=...` header and the "allowed-origin" parameter matched the
// `expected_origin`.
bool HasStorageAccessRetryHeader(const std::string* expected_origin) const;
// Returns true if the HTTP response code passed in corresponds to a
// redirect.
static bool IsRedirectResponseCode(int response_code);
// Returns VALIDATION_NONE if the response can be reused without
// validation. VALIDATION_ASYNCHRONOUS means the response can be re-used, but
// asynchronous revalidation must be performed. VALIDATION_SYNCHRONOUS means
// that the result cannot be reused without revalidation.
// The result is relative to the current_time parameter, which is
// a parameter to support unit testing. The request_time parameter indicates
// the time at which the request was made that resulted in this response,
// which was received at response_time.
ValidationType RequiresValidation(base::Time request_time,
base::Time response_time,
base::Time current_time) const;
// Calculates the amount of time the server claims the response is fresh from
// the time the response was generated. See section 13.2.4 of RFC 2616. See
// RequiresValidation for a description of the response_time parameter. See
// the definition of FreshnessLifetimes above for the meaning of the return
// value. See RFC 5861 section 3 for the definition of
// stale-while-revalidate.
FreshnessLifetimes GetFreshnessLifetimes(base::Time response_time) const;
// Returns the age of the response. See section 13.2.3 of RFC 2616.
// See RequiresValidation for a description of this method's parameters.
base::TimeDelta GetCurrentAge(base::Time request_time,
base::Time response_time,
base::Time current_time) const;
// The following methods extract values from the response headers. If a value
// is not present, or is invalid, then std::nullopt is returned. Otherwise,
// the value is returned directly.
// Note that GetMaxAgeValue method is intended for testing purposes only and
// should not be used in production code.
std::optional<base::TimeDelta> GetMaxAgeValue() const;
std::optional<base::TimeDelta> GetAgeValue() const;
std::optional<base::Time> GetDateValue() const;
std::optional<base::Time> GetLastModifiedValue() const;
std::optional<base::Time> GetExpiresValue() const;
// Note that GetStaleWhileRevalidateValue method is intended for testing
// purposes only and should not be used in production code.
std::optional<base::TimeDelta> GetStaleWhileRevalidateValue() const;
// Extracts the time value of a particular header. This method looks for the
// first matching header value and parses its value as a HTTP-date.
std::optional<base::Time> GetTimeValuedHeader(const std::string& name) const;
// Determines if this response indicates a keep-alive connection.
bool IsKeepAlive() const;
// Returns true if this response has a strong etag or last-modified header.
// See section 13.3.3 of RFC 2616.
bool HasStrongValidators() const;
// Returns true if this response has any validator (either a Last-Modified or
// an ETag) regardless of whether it is strong or weak. See section 13.3.3 of
// RFC 2616.
bool HasValidators() const;
// Extracts the value of the Content-Length header or returns -1 if there is
// no such header in the response.
int64_t GetContentLength() const;
// Extracts the value of the specified header or returns -1 if there is no
// such header in the response.
int64_t GetInt64HeaderValue(const std::string& header) const;
// Extracts the values in a Content-Range header and returns true if all three
// values are present and valid for a 206 response; otherwise returns false.
// The following values will be outputted:
// |*first_byte_position| = inclusive position of the first byte of the range
// |*last_byte_position| = inclusive position of the last byte of the range
// |*instance_length| = size in bytes of the object requested
// If this method returns false, then all of the outputs will be -1.
bool GetContentRangeFor206(int64_t* first_byte_position,
int64_t* last_byte_position,
int64_t* instance_length) const;
// Returns true if the response is chunk-encoded.
bool IsChunkEncoded() const;
// Creates a Value for use with the NetLog containing the response headers.
base::Value::Dict NetLogParams(NetLogCaptureMode capture_mode) const;
// Returns the HTTP response code. This is 0 if the response code text seems
// to exist but could not be parsed. Otherwise, it defaults to 200 if the
// response code is not found in the raw headers.
int response_code() const { return response_code_; }
// Returns the raw header string.
const std::string& raw_headers() const { return raw_headers_; }
// Returns true if |name| is a cookie related header name. This is consistent
// with |PERSIST_SANS_COOKIES|.
static bool IsCookieResponseHeader(std::string_view name);
// Write a representation of this object into tracing proto.
void WriteIntoTrace(perfetto::TracedValue context) const;
// Returns true if this instance precises matches another. This is stronger
// than semantic equality as it is intended for verification that the new
// Builder implementation works correctly.
bool StrictlyEquals(const HttpResponseHeaders& other) const;
private:
friend class base::RefCountedThreadSafe<HttpResponseHeaders>;
using HeaderSet = std::unordered_set<std::string>;
// The members of this structure point into raw_headers_.
struct ParsedHeader;
typedef std::vector<ParsedHeader> HeaderList;
// Whether or not a header value passed to the private AddHeader() method
// contains commas.
enum class ContainsCommas {
kNo, // Definitely no commas. No need to parse it.
kYes, // Contains commas. Needs to be parsed.
kMaybe, // Unknown whether commas are present. Needs to be parsed.
};
struct CacheControlFreshnessDirectives {
// Whether the 'must-revalidate' directive is present
bool must_revalidate = false;
// Value of the 'max-age' directive in seconds, if present
std::optional<base::TimeDelta> max_age;
// Value of the 'stale-while-revalidate' directive in seconds, if present
std::optional<base::TimeDelta> stale_while_revalidate;
};
~HttpResponseHeaders();
// Initializes from the given raw headers.
void Parse(std::string_view raw_input);
// Helper function for ParseStatusLine.
// Tries to extract the "HTTP/X.Y" from a status line formatted like:
// HTTP/1.1 200 OK
// with line_begin and end pointing at the begin and end of this line. If the
// status line is malformed, returns HttpVersion(0,0).
static HttpVersion ParseVersion(std::string_view line);
// Tries to extract the status line from a header block, given the first
// line of said header block. If the status line is malformed, we'll
// construct a valid one. Example input:
// HTTP/1.1 200 OK
// with line_begin and end pointing at the begin and end of this line.
// Output will be a normalized version of this.
void ParseStatusLine(std::string_view line, bool has_headers);
// Find the header in our list (case-insensitive) starting with |parsed_| at
// index |from|. Returns string::npos if not found.
size_t FindHeader(size_t from, std::string_view name) const;
// Search the Cache-Control header for a directive matching |directive|. If
// present, treat its value as a time offset in seconds.
// Note that the method is intended for testing purposes only and should not
// be used in production code.
std::optional<base::TimeDelta> GetCacheControlHeaderValueForTesting(
const std::string_view directive) const;
// Add header->value pair(s) to our list. The value will be split into
// multiple values if it contains unquoted commas. If `contains_commas` is
// ContainsCommas::kNo then the value will not be parsed as a performance
// optimization. Values are all offsets within `raw_headers_`.
void AddHeader(size_t name_begin,
size_t name_end,
size_t value_begin,
size_t value_end,
ContainsCommas contains_commas);
// Add to parsed_ given the fields of a ParsedHeader object. Values are all
// offsets within `raw_headers_`.
void AddToParsed(size_t name_begin,
size_t name_end,
size_t value_begin,
size_t value_end);
// Replaces the current headers with the merged version of `raw_headers` and
// the current headers without the headers in `headers_to_remove`. Note that
// `headers_to_remove` are removed from the current headers (before the
// merge), not after the merge.
// `raw_headers` is a std::string, not a const reference to a std::string,
// to avoid a potentially excessive copy.
void MergeWithHeaders(std::string raw_headers,
const HeaderSet& headers_to_remove);
// Adds the values from any 'cache-control: no-cache="foo,bar"' headers.
void AddNonCacheableHeaders(HeaderSet* header_names) const;
// Checks if the response contains Cache-Control directives that restrict
// caching. Specifically checks for the presence of "no-cache" or "no-store"
// directives. It true if either "no-cache" or "no-store" directive is present
// in any Cache-Control header, false otherwise.
bool HasCacheRestriction() const;
// Parses Cache-Control headers to extract directives related to response
// freshness. Processes "must-revalidate", "max-age", and
// "stale-while-revalidate" directives, which control how long a cached
// response can be considered fresh and whether it can be used while
// asynchronously revalidating in the background.
CacheControlFreshnessDirectives ParseCacheControlDirectivesForFreshness()
const;
// Parses the numeric value from a Cache-Control directive that expects
// a non-negative integer value (e.g., "max-age=600" or
// "stale-while-revalidate=300"). parameter directive_size The length of the
// directive name including the equals sign. parameter value The complete
// directive string (e.g., "max-age=600"). or not a valid sequence of digits.
std::optional<base::TimeDelta> ParseSeconds(std::string_view value) const;
// Shorthand for `std::string_view(raw_headers_).substr(begin, end - begin)`.
std::string_view subrange(size_t begin, size_t end) const;
// Returns the name/value using `raw_headers_` and indices from `parsed`.
std::string_view header_name(const ParsedHeader& parsed) const;
std::string_view header_value(const ParsedHeader& parsed) const;
// Adds the set of header names that contain cookie values.
static void AddSensitiveHeaders(HeaderSet* header_names);
// Adds the set of rfc2616 hop-by-hop response headers.
static void AddHopByHopHeaders(HeaderSet* header_names);
// Adds the set of challenge response headers.
static void AddChallengeHeaders(HeaderSet* header_names);
// Adds the set of cookie response headers.
static void AddCookieHeaders(HeaderSet* header_names);
// Adds the set of content range response headers.
static void AddHopContentRangeHeaders(HeaderSet* header_names);
// Adds the set of transport security state headers.
static void AddSecurityStateHeaders(HeaderSet* header_names);
// We keep a list of ParsedHeader objects. These tell us where to locate the
// header-value pairs within raw_headers_.
HeaderList parsed_;
// The raw_headers_ consists of the normalized status line (terminated with a
// null byte) and then followed by the raw null-terminated headers from the
// input that was passed to our constructor. We preserve the input [*] to
// maintain as much ancillary fidelity as possible (since it is sometimes
// hard to tell what may matter down-stream to a consumer of XMLHttpRequest).
// [*] The status line may be modified.
std::string raw_headers_;
// This is the parsed HTTP response code.
int response_code_;
// The normalized http version (consistent with what GetStatusLine() returns).
HttpVersion http_version_;
};
using ResponseHeadersCallback =
base::RepeatingCallback<void(scoped_refptr<const HttpResponseHeaders>)>;
} // namespace net
#endif // NET_HTTP_HTTP_RESPONSE_HEADERS_H_