blob: c6e3359b9bc0dcd84f2ad8dbb07bc00e9b54c79c [file] [log] [blame]
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "extensions/common/url_pattern_set.h"
#include <iterator>
#include <ostream>
#include "base/logging.h"
#include "base/stl_util.h"
#include "base/values.h"
#include "extensions/common/error_utils.h"
#include "extensions/common/url_pattern.h"
#include "url/gurl.h"
#include "url/origin.h"
#include "url/url_constants.h"
namespace extensions {
namespace {
const char kInvalidURLPatternError[] = "Invalid url pattern '*'";
} // namespace
// static
URLPatternSet URLPatternSet::CreateDifference(const URLPatternSet& set1,
const URLPatternSet& set2) {
return URLPatternSet(base::STLSetDifference<std::set<URLPattern>>(
set1.patterns_, set2.patterns_));
}
// static
URLPatternSet URLPatternSet::CreateIntersection(
const URLPatternSet& set1,
const URLPatternSet& set2,
IntersectionBehavior intersection_behavior) {
// Note: leverage return value optimization; always return the same object.
URLPatternSet result;
if (intersection_behavior == IntersectionBehavior::kStringComparison) {
// String comparison just relies on STL set behavior, which looks at the
// string representation.
result = URLPatternSet(base::STLSetIntersection<std::set<URLPattern>>(
set1.patterns_, set2.patterns_));
return result;
}
// Look for a semantic intersection.
// Step 1: Iterate over each set. Find any patterns that are completely
// contained by the other (thus being necessarily present in any intersection)
// and add them, collecting the others in a set of unique items.
// Note: Use a collection of pointers for the uniques to avoid excessive
// copies. Since these are owned by the URLPatternSet passed in, which is
// const, this should be safe.
std::vector<const URLPattern*> unique_set1;
for (const URLPattern& pattern : set1) {
if (set2.ContainsPattern(pattern))
result.patterns_.insert(pattern);
else
unique_set1.push_back(&pattern);
}
std::vector<const URLPattern*> unique_set2;
for (const URLPattern& pattern : set2) {
if (set1.ContainsPattern(pattern))
result.patterns_.insert(pattern);
else
unique_set2.push_back(&pattern);
}
// If we're just looking for patterns contained by both, we're done.
if (intersection_behavior == IntersectionBehavior::kPatternsContainedByBoth)
return result;
DCHECK_EQ(IntersectionBehavior::kDetailed, intersection_behavior);
// Step 2: Iterate over all the unique patterns and find the intersections
// they have with the other patterns.
for (const auto* pattern : unique_set1) {
for (const auto* pattern2 : unique_set2) {
base::Optional<URLPattern> intersection =
pattern->CreateIntersection(*pattern2);
if (intersection)
result.patterns_.insert(std::move(*intersection));
}
}
return result;
}
// static
URLPatternSet URLPatternSet::CreateUnion(const URLPatternSet& set1,
const URLPatternSet& set2) {
return URLPatternSet(
base::STLSetUnion<std::set<URLPattern>>(set1.patterns_, set2.patterns_));
}
// static
URLPatternSet URLPatternSet::CreateUnion(
const std::vector<URLPatternSet>& sets) {
URLPatternSet result;
if (sets.empty())
return result;
// N-way union algorithm is basic O(nlog(n)) merge algorithm.
//
// Do the first merge step into a working set so that we don't mutate any of
// the input.
// TODO(devlin): Looks like this creates a bunch of copies; we can probably
// clean that up.
std::vector<URLPatternSet> working;
for (size_t i = 0; i < sets.size(); i += 2) {
if (i + 1 < sets.size())
working.push_back(CreateUnion(sets[i], sets[i + 1]));
else
working.push_back(sets[i].Clone());
}
for (size_t skip = 1; skip < working.size(); skip *= 2) {
for (size_t i = 0; i < (working.size() - skip); i += skip) {
URLPatternSet u = CreateUnion(working[i], working[i + skip]);
working[i].patterns_.swap(u.patterns_);
}
}
result.patterns_.swap(working[0].patterns_);
return result;
}
URLPatternSet::URLPatternSet() = default;
URLPatternSet::URLPatternSet(URLPatternSet&& rhs) = default;
URLPatternSet::URLPatternSet(const std::set<URLPattern>& patterns)
: patterns_(patterns) {}
URLPatternSet::~URLPatternSet() = default;
URLPatternSet& URLPatternSet::operator=(URLPatternSet&& rhs) = default;
bool URLPatternSet::operator==(const URLPatternSet& other) const {
return patterns_ == other.patterns_;
}
std::ostream& operator<<(std::ostream& out,
const URLPatternSet& url_pattern_set) {
out << "{ ";
auto iter = url_pattern_set.patterns().cbegin();
if (!url_pattern_set.patterns().empty()) {
out << *iter;
++iter;
}
for (;iter != url_pattern_set.patterns().end(); ++iter)
out << ", " << *iter;
if (!url_pattern_set.patterns().empty())
out << " ";
out << "}";
return out;
}
URLPatternSet URLPatternSet::Clone() const {
return URLPatternSet(patterns_);
}
bool URLPatternSet::is_empty() const {
return patterns_.empty();
}
size_t URLPatternSet::size() const {
return patterns_.size();
}
bool URLPatternSet::AddPattern(const URLPattern& pattern) {
return patterns_.insert(pattern).second;
}
void URLPatternSet::AddPatterns(const URLPatternSet& set) {
patterns_.insert(set.patterns().begin(),
set.patterns().end());
}
void URLPatternSet::ClearPatterns() {
patterns_.clear();
}
bool URLPatternSet::AddOrigin(int valid_schemes, const GURL& origin) {
if (origin.is_empty())
return false;
const url::Origin real_origin = url::Origin::Create(origin);
DCHECK(real_origin.IsSameOriginWith(url::Origin::Create(origin.GetOrigin())));
URLPattern origin_pattern(valid_schemes);
// Origin adding could fail if |origin| does not match |valid_schemes|.
if (origin_pattern.Parse(origin.spec()) !=
URLPattern::ParseResult::kSuccess) {
return false;
}
origin_pattern.SetPath("/*");
return AddPattern(origin_pattern);
}
bool URLPatternSet::Contains(const URLPatternSet& other) const {
for (auto it = other.begin(); it != other.end(); ++it) {
if (!ContainsPattern(*it))
return false;
}
return true;
}
bool URLPatternSet::ContainsPattern(const URLPattern& pattern) const {
for (auto it = begin(); it != end(); ++it) {
if (it->Contains(pattern))
return true;
}
return false;
}
bool URLPatternSet::MatchesURL(const GURL& url) const {
for (auto pattern = patterns_.cbegin(); pattern != patterns_.cend();
++pattern) {
if (pattern->MatchesURL(url))
return true;
}
return false;
}
bool URLPatternSet::MatchesAllURLs() const {
for (auto host = begin(); host != end(); ++host) {
if (host->match_all_urls() ||
(host->match_subdomains() && host->host().empty()))
return true;
}
return false;
}
bool URLPatternSet::MatchesSecurityOrigin(const GURL& origin) const {
for (auto pattern = patterns_.begin(); pattern != patterns_.end();
++pattern) {
if (pattern->MatchesSecurityOrigin(origin))
return true;
}
return false;
}
bool URLPatternSet::OverlapsWith(const URLPatternSet& other) const {
// Two extension extents overlap if there is any one URL that would match at
// least one pattern in each of the extents.
for (auto i = patterns_.cbegin(); i != patterns_.cend(); ++i) {
for (auto j = other.patterns().cbegin(); j != other.patterns().cend();
++j) {
if (i->OverlapsWith(*j))
return true;
}
}
return false;
}
std::unique_ptr<base::ListValue> URLPatternSet::ToValue() const {
std::unique_ptr<base::ListValue> value(new base::ListValue);
for (auto i = patterns_.cbegin(); i != patterns_.cend(); ++i)
value->AppendIfNotPresent(std::make_unique<base::Value>(i->GetAsString()));
return value;
}
bool URLPatternSet::Populate(const std::vector<std::string>& patterns,
int valid_schemes,
bool allow_file_access,
std::string* error) {
ClearPatterns();
for (size_t i = 0; i < patterns.size(); ++i) {
URLPattern pattern(valid_schemes);
if (pattern.Parse(patterns[i]) != URLPattern::ParseResult::kSuccess) {
if (error) {
*error = ErrorUtils::FormatErrorMessage(kInvalidURLPatternError,
patterns[i]);
} else {
LOG(ERROR) << "Invalid url pattern: " << patterns[i];
}
return false;
}
if (!allow_file_access && pattern.MatchesScheme(url::kFileScheme)) {
pattern.SetValidSchemes(
pattern.valid_schemes() & ~URLPattern::SCHEME_FILE);
}
AddPattern(pattern);
}
return true;
}
std::unique_ptr<std::vector<std::string>> URLPatternSet::ToStringVector()
const {
std::unique_ptr<std::vector<std::string>> value(new std::vector<std::string>);
for (auto i = patterns_.cbegin(); i != patterns_.cend(); ++i) {
value->push_back(i->GetAsString());
}
return value;
}
bool URLPatternSet::Populate(const base::ListValue& value,
int valid_schemes,
bool allow_file_access,
std::string* error) {
std::vector<std::string> patterns;
for (size_t i = 0; i < value.GetSize(); ++i) {
std::string item;
if (!value.GetString(i, &item))
return false;
patterns.push_back(item);
}
return Populate(patterns, valid_schemes, allow_file_access, error);
}
} // namespace extensions