blob: ac8ca7ba0ff239497281092c6dc2f4dac4e45c59 [file] [log] [blame]
// Copyright 2019 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#ifndef NET_REPORTING_REPORTING_CACHE_IMPL_H_
#define NET_REPORTING_REPORTING_CACHE_IMPL_H_
#include <map>
#include <memory>
#include <set>
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>
#include "base/macros.h"
#include "base/optional.h"
#include "base/sequence_checker.h"
#include "base/time/time.h"
#include "base/values.h"
#include "net/reporting/reporting_cache.h"
#include "net/reporting/reporting_context.h"
#include "net/reporting/reporting_endpoint.h"
#include "net/reporting/reporting_header_parser.h"
#include "net/reporting/reporting_report.h"
#include "url/gurl.h"
#include "url/origin.h"
namespace net {
class ReportingCacheImpl : public ReportingCache {
public:
ReportingCacheImpl(ReportingContext* context);
~ReportingCacheImpl() override;
// ReportingCache implementation
void AddReport(const GURL& url,
const std::string& user_agent,
const std::string& group_name,
const std::string& type,
std::unique_ptr<const base::Value> body,
int depth,
base::TimeTicks queued,
int attempts) override;
void GetReports(
std::vector<const ReportingReport*>* reports_out) const override;
base::Value GetReportsAsValue() const override;
void GetNonpendingReports(
std::vector<const ReportingReport*>* reports_out) const override;
void SetReportsPending(
const std::vector<const ReportingReport*>& reports) override;
void ClearReportsPending(
const std::vector<const ReportingReport*>& reports) override;
void IncrementReportsAttempts(
const std::vector<const ReportingReport*>& reports) override;
void IncrementEndpointDeliveries(const url::Origin& origin,
const std::string& group_name,
const GURL& url,
int reports_delivered,
bool successful) override;
void RemoveReports(const std::vector<const ReportingReport*>& reports,
ReportingReport::Outcome outcome) override;
void RemoveAllReports(ReportingReport::Outcome outcome) override;
size_t GetFullReportCountForTesting() const override;
bool IsReportPendingForTesting(const ReportingReport* report) const override;
bool IsReportDoomedForTesting(const ReportingReport* report) const override;
void OnParsedHeader(
const url::Origin& origin,
std::vector<ReportingEndpointGroup> parsed_header) override;
std::vector<url::Origin> GetAllOrigins() const override;
void RemoveClient(const url::Origin& origin) override;
void RemoveAllClients() override;
void RemoveEndpointGroup(const url::Origin& origin,
const std::string& name) override;
void RemoveEndpointsForUrl(const GURL& url) override;
void AddClientsLoadedFromStore(
std::vector<ReportingEndpoint> loaded_endpoints,
std::vector<CachedReportingEndpointGroup> loaded_endpoint_groups)
override;
std::vector<ReportingEndpoint> GetCandidateEndpointsForDelivery(
const url::Origin& origin,
const std::string& group_name) override;
base::Value GetClientsAsValue() const override;
size_t GetEndpointCount() const override;
void Flush() override;
ReportingEndpoint GetEndpointForTesting(const url::Origin& origin,
const std::string& group_name,
const GURL& url) const override;
bool EndpointGroupExistsForTesting(const url::Origin& origin,
const std::string& group_name,
OriginSubdomains include_subdomains,
base::Time expires) const override;
size_t GetEndpointGroupCountForTesting() const override;
void SetEndpointForTesting(const url::Origin& origin,
const std::string& group_name,
const GURL& url,
OriginSubdomains include_subdomains,
base::Time expires,
int priority,
int weight) override;
private:
// Represents the entire Report-To configuration for an origin.
struct OriginClient {
explicit OriginClient(url::Origin origin);
OriginClient(const OriginClient& other);
OriginClient(OriginClient&& other);
~OriginClient();
// Origin that configured this client.
const url::Origin origin;
// Total number of endpoints for this origin. Should stay in sync with the
// sum of endpoint counts for all the groups within this client.
size_t endpoint_count = 0;
// Last time that any of the groups for this origin was accessed for a
// delivery or updated via a new header. Should stay in sync with the latest
// |last_used| of all the groups within this client.
base::Time last_used;
// Set of endpoint group names for this origin.
std::set<std::string> endpoint_group_names;
};
using OriginClientMap = std::unordered_multimap<std::string, OriginClient>;
using EndpointGroupMap =
std::map<ReportingEndpointGroupKey, CachedReportingEndpointGroup>;
using EndpointMap =
std::multimap<ReportingEndpointGroupKey, ReportingEndpoint>;
void RemoveReportInternal(const ReportingReport* report);
const ReportingReport* FindReportToEvict() const;
// Sanity-checks the entire data structure of clients, groups, and endpoints,
// if DCHECK is on. The cached clients should pass this sanity check after
// completely parsing a header (i.e. not after the intermediate steps), and
// before and after any of the public methods that remove or retrieve client
// info. Also calls |sequence_checker_| to DCHECK that we are being called on
// a valid sequence.
void SanityCheckClients() const;
// Helper methods for SanityCheckClients():
#if DCHECK_IS_ON()
// Returns number of endpoint groups found in |client|.
size_t SanityCheckOriginClient(const std::string& domain,
const OriginClient& client) const;
// Returns the number of endpoints found in |group|.
size_t SanityCheckEndpointGroup(
const ReportingEndpointGroupKey& key,
const CachedReportingEndpointGroup& group) const;
void SanityCheckEndpoint(const ReportingEndpointGroupKey& key,
const ReportingEndpoint& endpoint,
EndpointMap::const_iterator endpoint_it) const;
#endif // DCHECK_IS_ON()
// Finds iterator to the client with the given |origin|, if one exists.
// Returns |origin_clients_.end()| if none is found.
OriginClientMap::iterator FindClientIt(const url::Origin& origin);
// Finds iterator to the endpoint group identified by |group_key| (origin and
// name), if one exists. Returns |endpoint_groups_.end()| if none is found.
EndpointGroupMap::iterator FindEndpointGroupIt(
const ReportingEndpointGroupKey& group_key);
// Finds iterator to the endpoint for the given |group_key| (origin and group
// name) and |url|, if one exists. Returns |endpoints_.end()| if none is
// found.
EndpointMap::iterator FindEndpointIt(
const ReportingEndpointGroupKey& group_key,
const GURL& url);
// Adds a new client, endpoint group, or endpoint to the cache, if none
// exists. If one already exists, updates the existing entry to match the new
// one.
void AddOrUpdateClient(OriginClient new_client);
void AddOrUpdateEndpointGroup(CachedReportingEndpointGroup new_group);
void AddOrUpdateEndpoint(ReportingEndpoint new_endpoint);
// Remove all the endpoints configured for |origin| and |group| whose urls are
// not in |endpoints_to_keep_urls|. Does not guarantee that all the endpoints
// in |endpoints_to_keep_urls| exist in the cache for that group.
void RemoveEndpointsInGroupOtherThan(
const ReportingEndpointGroupKey& group_key,
const std::set<GURL>& endpoints_to_keep_urls);
// Remove all the endpoint groups for |origin| whose names are not in
// |groups_to_keep_names|. Does not guarantee that all the groups in
// |groups_to_keep_names| exist in the cache for that origin.
void RemoveEndpointGroupsForOriginOtherThan(
const url::Origin& origin,
const std::set<std::string>& groups_to_keep_names);
// Gets the endpoints in the given group.
std::vector<ReportingEndpoint> GetEndpointsInGroup(
const ReportingEndpointGroupKey& group_key) const;
// Gets the number of endpoints for the given origin and group.
size_t GetEndpointCountInGroup(
const ReportingEndpointGroupKey& group_key) const;
// Updates the last_used time for the given origin and endpoint group.
void MarkEndpointGroupAndClientUsed(OriginClientMap::iterator client_it,
EndpointGroupMap::iterator group_it,
base::Time now);
// Removes the endpoint at the given iterator, which must exist in the cache.
// Also takes iterators to the client and endpoint group to avoid repeated
// lookups. May cause the client and/or group to be removed if they become
// empty, which would invalidate those iterators.
// Returns the iterator following the endpoint removed, or base::nullopt if
// either of |group_it| or |client_it| were invalidated. (If |client_it| is
// invalidated, then so must |group_it|).
base::Optional<EndpointMap::iterator> RemoveEndpointInternal(
OriginClientMap::iterator client_it,
EndpointGroupMap::iterator group_it,
EndpointMap::iterator endpoint_it);
// Removes the endpoint group at the given iterator (which must exist in the
// cache). Also takes iterator to the client to avoid repeated lookups. May
// cause the client to be removed if it becomes empty, which would
// invalidate |client_it|. If |num_endpoints_removed| is not null, then
// |*num_endpoints_removed| is incremented by the number of endpoints
// removed.
// Returns the iterator following the endpoint group removed, or base::nullopt
// if |client_it| was invalidated.
base::Optional<EndpointGroupMap::iterator> RemoveEndpointGroupInternal(
OriginClientMap::iterator client_it,
EndpointGroupMap::iterator group_it,
size_t* num_endpoints_removed = nullptr);
// Removes the client at the given iterator (which must exist in the cache),
// along with all of its endpoint groups and endpoints. Invalidates
// |client_it|.
// Returns the iterator following the client removed.
OriginClientMap::iterator RemoveClientInternal(
OriginClientMap::iterator client_it);
// Evict endpoints from |origin| and globally, if necessary to obey the
// per-origin and global endpoint limits set in the ReportingPolicy.
//
// To evict from a client: First evicts any stale or expired groups for that
// origin. If that removes enough endpoints, then stop. Otherwise, find the
// stalest group (which has not been accessed for a delivery in the longest
// time) with the most endpoints, and evict the least important endpoints from
// that group.
// To evict globally: Find the stalest client with the most endpoints and do
// the above.
void EnforcePerOriginAndGlobalEndpointLimits(const url::Origin& origin);
// Evicts endpoints from a client until it has evicted |endpoints_to_evict|
// endpoints. First tries to remove expired and stale groups. If that fails to
// satisfy the limit, finds the stalest group with the most endpoints and
// evicts the least important endpoints from it.
void EvictEndpointsFromClient(OriginClientMap::iterator client_it,
size_t endpoints_to_evict);
// Evicts the least important endpoint from a group (the endpoint with lowest
// priority and lowest weight). May cause the group and/or client to be
// deleted and the iterators invalidated.
void EvictEndpointFromGroup(OriginClientMap::iterator client_it,
EndpointGroupMap::iterator group_it);
// Removes all expired or stale groups from the given client. May delete the
// client and invalidate |client_it| if it becomes empty.
// Increments |*num_endpoints_removed| by the number of endpoints removed.
// Returns true if |client_it| was invalidated.
bool RemoveExpiredOrStaleGroups(OriginClientMap::iterator client_it,
size_t* num_endpoints_removed);
// Adds/removes (if it exists) |endpoint_it| from |endpoint_its_by_url_|.
void AddEndpointItToIndex(EndpointMap::iterator endpoint_it);
void RemoveEndpointItFromIndex(EndpointMap::iterator endpoint_it);
// Helper methods for GetClientsAsValue().
base::Value GetOriginClientAsValue(const OriginClient& client) const;
base::Value GetEndpointGroupAsValue(
const CachedReportingEndpointGroup& group) const;
base::Value GetEndpointAsValue(const ReportingEndpoint& endpoint) const;
// Convenience methods for fetching things from the context_.
const base::Clock& clock() const { return context_->clock(); }
const base::TickClock& tick_clock() const { return context_->tick_clock(); }
PersistentReportingStore* store() { return context_->store(); }
ReportingContext* context_;
// Owns all reports, keyed by const raw pointer for easier lookup.
std::unordered_map<const ReportingReport*, std::unique_ptr<ReportingReport>>
reports_;
// Reports that have been marked pending (in use elsewhere and should not be
// deleted until no longer pending).
std::unordered_set<const ReportingReport*> pending_reports_;
// Reports that have been marked doomed (would have been deleted, but were
// pending when the deletion was requested).
std::unordered_set<const ReportingReport*> doomed_reports_;
// Map of clients for all configured origins, keyed on domain name (there may
// be multiple origins per domain name).
OriginClientMap origin_clients_;
// Map of endpoint groups, keyed on origin and group name.
EndpointGroupMap endpoint_groups_;
// Map of endpoints, keyed on origin and group name (there may be multiple
// endpoints for a given origin and group, with different urls).
EndpointMap endpoints_;
// Index of endpoints stored in |endpoints_| keyed on URL, for easier lookup
// during RemoveEndpointsForUrl(). Should stay in sync with |endpoints_|.
std::multimap<GURL, EndpointMap::iterator> endpoint_its_by_url_;
SEQUENCE_CHECKER(sequence_checker_);
DISALLOW_COPY_AND_ASSIGN(ReportingCacheImpl);
};
} // namespace net
#endif // NET_REPORTING_REPORTING_CACHE_IMPL_H_