blob: d26f1790a740b3f8c5053d9baadc5e910f3e4006 [file] [log] [blame]
// Copyright 2017 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "net/reporting/reporting_header_parser.h"
#include <cstring>
#include <string>
#include <utility>
#include <vector>
#include "base/bind.h"
#include "base/check.h"
#include "base/feature_list.h"
#include "base/json/json_reader.h"
#include "base/metrics/histogram_functions.h"
#include "base/time/time.h"
#include "base/values.h"
#include "net/base/features.h"
#include "net/base/network_isolation_key.h"
#include "net/base/registry_controlled_domains/registry_controlled_domain.h"
#include "net/reporting/reporting_cache.h"
#include "net/reporting/reporting_context.h"
#include "net/reporting/reporting_delegate.h"
#include "net/reporting/reporting_endpoint.h"
namespace net {
namespace {
const char kUrlKey[] = "url";
const char kIncludeSubdomainsKey[] = "include_subdomains";
const char kEndpointsKey[] = "endpoints";
const char kGroupKey[] = "group";
const char kDefaultGroupName[] = "default";
const char kMaxAgeKey[] = "max_age";
const char kPriorityKey[] = "priority";
const char kWeightKey[] = "weight";
// Processes a single endpoint url string parsed from header.
//
// |endpoint_url_string| is the string value of the endpoint URL.
// |header_origin_url| is the origin URL that sent the header.
//
// |endpoint_url_out| is the endpoint URL parsed out of the string.
// Returns true on success or false if url was invalid.
bool ProcessEndpointURLString(const std::string& endpoint_url_string,
const url::Origin& header_origin,
GURL& endpoint_url_out) {
// Support path-absolute-URL string with exactly one leading "/"
if (std::strspn(endpoint_url_string.c_str(), "/") == 1) {
endpoint_url_out = header_origin.GetURL().Resolve(endpoint_url_string);
} else {
endpoint_url_out = GURL(endpoint_url_string);
}
if (!endpoint_url_out.is_valid())
return false;
if (!endpoint_url_out.SchemeIsCryptographic())
return false;
return true;
}
// Processes a single endpoint tuple received in a Report-To header.
//
// |origin| is the origin that sent the Report-To header.
//
// |value| is the parsed JSON value of the endpoint tuple.
//
// |*endpoint_info_out| will contain the endpoint URL parsed out of the tuple.
// Returns true on success or false if endpoint was discarded.
bool ProcessEndpoint(ReportingDelegate* delegate,
const ReportingEndpointGroupKey& group_key,
const base::Value& value,
ReportingEndpoint::EndpointInfo* endpoint_info_out) {
const base::DictionaryValue* dict = nullptr;
if (!value.GetAsDictionary(&dict))
return false;
DCHECK(dict);
std::string endpoint_url_string;
if (!dict->HasKey(kUrlKey))
return false;
if (!dict->GetString(kUrlKey, &endpoint_url_string))
return false;
GURL endpoint_url;
if (!ProcessEndpointURLString(endpoint_url_string, group_key.origin,
endpoint_url)) {
return false;
}
endpoint_info_out->url = std::move(endpoint_url);
int priority = ReportingEndpoint::EndpointInfo::kDefaultPriority;
if (dict->HasKey(kPriorityKey) && !dict->GetInteger(kPriorityKey, &priority))
return false;
if (priority < 0)
return false;
endpoint_info_out->priority = priority;
int weight = ReportingEndpoint::EndpointInfo::kDefaultWeight;
if (dict->HasKey(kWeightKey) && !dict->GetInteger(kWeightKey, &weight))
return false;
if (weight < 0)
return false;
endpoint_info_out->weight = weight;
return delegate->CanSetClient(group_key.origin, endpoint_info_out->url);
}
// Processes a single endpoint group tuple received in a Report-To header.
//
// |origin| is the origin that sent the Report-To header.
//
// |value| is the parsed JSON value of the endpoint group tuple.
// Returns true on successfully adding a non-empty group, or false if endpoint
// group was discarded or processed as a deletion.
bool ProcessEndpointGroup(ReportingDelegate* delegate,
ReportingCache* cache,
const NetworkIsolationKey& network_isolation_key,
const url::Origin& origin,
const base::Value& value,
ReportingEndpointGroup* parsed_endpoint_group_out) {
const base::DictionaryValue* dict = nullptr;
if (!value.GetAsDictionary(&dict))
return false;
DCHECK(dict);
std::string group_name = kDefaultGroupName;
if (dict->HasKey(kGroupKey) && !dict->GetString(kGroupKey, &group_name))
return false;
ReportingEndpointGroupKey group_key(network_isolation_key, origin,
group_name);
parsed_endpoint_group_out->group_key = group_key;
int ttl_sec = -1;
if (!dict->HasKey(kMaxAgeKey))
return false;
if (!dict->GetInteger(kMaxAgeKey, &ttl_sec))
return false;
if (ttl_sec < 0)
return false;
// max_age: 0 signifies removal of the endpoint group.
if (ttl_sec == 0) {
cache->RemoveEndpointGroup(group_key);
return false;
}
parsed_endpoint_group_out->ttl = base::TimeDelta::FromSeconds(ttl_sec);
bool subdomains_bool = false;
if (dict->HasKey(kIncludeSubdomainsKey) &&
dict->GetBoolean(kIncludeSubdomainsKey, &subdomains_bool) &&
subdomains_bool == true) {
// Disallow eTLDs from setting include_subdomains endpoint groups.
if (registry_controlled_domains::GetRegistryLength(
origin.GetURL(),
registry_controlled_domains::INCLUDE_UNKNOWN_REGISTRIES,
registry_controlled_domains::INCLUDE_PRIVATE_REGISTRIES) == 0) {
return false;
}
parsed_endpoint_group_out->include_subdomains = OriginSubdomains::INCLUDE;
}
const base::ListValue* endpoint_list = nullptr;
if (!dict->HasKey(kEndpointsKey))
return false;
if (!dict->GetList(kEndpointsKey, &endpoint_list))
return false;
std::vector<ReportingEndpoint::EndpointInfo> endpoints;
for (size_t i = 0; i < endpoint_list->GetSize(); i++) {
const base::Value* endpoint = nullptr;
bool got_endpoint = endpoint_list->Get(i, &endpoint);
DCHECK(got_endpoint);
ReportingEndpoint::EndpointInfo parsed_endpoint;
if (ProcessEndpoint(delegate, group_key, *endpoint, &parsed_endpoint))
endpoints.push_back(std::move(parsed_endpoint));
}
// Remove the group if it is empty.
if (endpoints.empty()) {
cache->RemoveEndpointGroup(group_key);
return false;
}
parsed_endpoint_group_out->endpoints = std::move(endpoints);
return true;
}
// Processes a single endpoint tuple received in a Reporting-Endpoints header.
//
// |group_key| is the key for the endpoint group this endpoint belongs.
// |endpoint_url_string| is the endpoint url as received in the header.
//
// |endpoint_info_out| is the endpoint info parsed out of the value.
bool ProcessEndpoint(ReportingDelegate* delegate,
const ReportingEndpointGroupKey& group_key,
const std::string& endpoint_url_string,
ReportingEndpoint::EndpointInfo& endpoint_info_out) {
if (endpoint_url_string.empty())
return false;
GURL endpoint_url;
if (!ProcessEndpointURLString(endpoint_url_string, group_key.origin,
endpoint_url)) {
return false;
}
endpoint_info_out.url = std::move(endpoint_url);
// Reporting-Endpoints endpoint doesn't have prioirty/weight so set to
// default.
endpoint_info_out.priority =
ReportingEndpoint::EndpointInfo::kDefaultPriority;
endpoint_info_out.weight = ReportingEndpoint::EndpointInfo::kDefaultWeight;
return delegate->CanSetClient(group_key.origin, endpoint_info_out.url);
}
// Process a single endpoint received in a Reporting-Endpoints header.
// Since the new header format only contains information for a single endpoint,
// the endpoint group we create here is just a wrapper for that endpoint. The
// endpoint name will be stored in the group name here as individual endpoint
// doesn't have names.
bool ProcessDocumentEndpoint(
ReportingDelegate* delegate,
ReportingCache* cache,
const NetworkIsolationKey& network_isolation_key,
const url::Origin& origin,
const std::string& endpoint_name,
const std::string& endpoint_url_string,
ReportingEndpointGroup& parsed_endpoint_group_out) {
ReportingEndpointGroupKey group_key(network_isolation_key, origin,
endpoint_name);
parsed_endpoint_group_out.group_key = group_key;
// Default to a fixed number of days as Reporting-Endpoints doesn't have the
// concept of a ttl, its lifespan will be bound to the containing document. 30
// days is picked as long enough so endpoints are unlikely to be removed
// before the document is closed.
parsed_endpoint_group_out.ttl = base::TimeDelta::FromDays(30);
ReportingEndpoint::EndpointInfo parsed_endpoint;
if (!ProcessEndpoint(delegate, group_key, endpoint_url_string,
parsed_endpoint)) {
// Remove the group if it does not have a proper endpoint.
cache->RemoveEndpointGroup(group_key);
return false;
}
parsed_endpoint_group_out.endpoints = {std::move(parsed_endpoint)};
return true;
}
} // namespace
absl::optional<base::flat_map<std::string, std::string>>
ParseReportingEndpoints(const std::string& header) {
absl::optional<structured_headers::Dictionary> header_dict =
structured_headers::ParseDictionary(header);
if (!header_dict) {
return absl::nullopt;
}
base::flat_map<std::string, std::string> parsed_header;
for (const structured_headers::DictionaryMember& entry : *header_dict) {
if (entry.second.member_is_inner_list ||
!entry.second.member.front().item.is_string()) {
return absl::nullopt;
}
const std::string& endpoint_url_string =
entry.second.member.front().item.GetString();
parsed_header[entry.first] = endpoint_url_string;
}
return parsed_header;
}
// static
void ReportingHeaderParser::RecordReportingHeaderType(
ReportingHeaderType header_type) {
base::UmaHistogramEnumeration("Net.Reporting.HeaderType", header_type);
}
// static
void ReportingHeaderParser::ParseReportToHeader(
ReportingContext* context,
const NetworkIsolationKey& network_isolation_key,
const GURL& url,
std::unique_ptr<base::Value> value) {
DCHECK(url.SchemeIsCryptographic());
const base::ListValue* group_list = nullptr;
bool is_list = value->GetAsList(&group_list);
DCHECK(is_list);
ReportingDelegate* delegate = context->delegate();
ReportingCache* cache = context->cache();
url::Origin origin = url::Origin::Create(url);
std::vector<ReportingEndpointGroup> parsed_header;
for (size_t i = 0; i < group_list->GetSize(); i++) {
const base::Value* group_value = nullptr;
bool got_group = group_list->Get(i, &group_value);
DCHECK(got_group);
ReportingEndpointGroup parsed_endpoint_group;
if (ProcessEndpointGroup(delegate, cache, network_isolation_key, origin,
*group_value, &parsed_endpoint_group)) {
parsed_header.push_back(std::move(parsed_endpoint_group));
}
}
if (parsed_header.empty() && group_list->GetSize() > 0) {
RecordReportingHeaderType(ReportingHeaderType::kReportToInvalid);
}
// Remove the client if it has no valid endpoint groups.
if (parsed_header.empty()) {
cache->RemoveClient(network_isolation_key, origin);
return;
}
RecordReportingHeaderType(ReportingHeaderType::kReportTo);
cache->OnParsedHeader(network_isolation_key, origin,
std::move(parsed_header));
}
// static
void ReportingHeaderParser::ProcessParsedReportingEndpointsHeader(
ReportingContext* context,
const NetworkIsolationKey& network_isolation_key,
const url::Origin& origin,
base::flat_map<std::string, std::string> header) {
DCHECK(base::FeatureList::IsEnabled(net::features::kDocumentReporting));
DCHECK(GURL::SchemeIsCryptographic(origin.scheme()));
ReportingDelegate* delegate = context->delegate();
ReportingCache* cache = context->cache();
std::vector<ReportingEndpointGroup> parsed_header;
for (const auto& member : header) {
ReportingEndpointGroup parsed_endpoint;
if (ProcessDocumentEndpoint(delegate, cache, network_isolation_key, origin,
member.first, member.second, parsed_endpoint)) {
parsed_header.push_back(std::move(parsed_endpoint));
}
}
// Remove the client if it has no valid endpoint groups.
if (parsed_header.empty()) {
cache->RemoveClient(network_isolation_key, origin);
return;
}
cache->OnParsedHeader(network_isolation_key, origin,
std::move(parsed_header));
}
} // namespace net