blob: 3804a1cef10633e8b357467f13c00d1385dd6f65 [file] [log] [blame]
// Copyright (c) 2011 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// This class is used by the RenderView to interact with a PhishingClassifier.
#include <memory>
#include "base/macros.h"
#include "base/strings/string16.h"
#include "content/public/renderer/render_frame_observer.h"
#include "content/public/renderer/render_thread_observer.h"
#include "ui/base/page_transition_types.h"
#include "url/gurl.h"
namespace safe_browsing {
class ClientPhishingRequest;
class PhishingClassifier;
class Scorer;
class PhishingClassifierFilter : public content::RenderThreadObserver {
static PhishingClassifierFilter* Create();
~PhishingClassifierFilter() override;
bool OnControlMessageReceived(const IPC::Message& message) override;
void OnSetPhishingModel(const std::string& model);
class PhishingClassifierDelegate : public content::RenderFrameObserver {
// The RenderFrame owns us. This object takes ownership of the classifier.
// Note that if classifier is null, a default instance of PhishingClassifier
// will be used.
static PhishingClassifierDelegate* Create(content::RenderFrame* render_frame,
PhishingClassifier* classifier);
~PhishingClassifierDelegate() override;
// Called by the RenderFrame once there is a phishing scorer available.
// The scorer is passed on to the classifier.
void SetPhishingScorer(const safe_browsing::Scorer* scorer);
// Called by the RenderFrame once a page has finished loading. Updates the
// last-loaded URL and page text, then starts classification if all other
// conditions are met (see MaybeStartClassification for details).
// We ignore preliminary captures, since these happen before the page has
// finished loading.
void PageCaptured(base::string16* page_text, bool preliminary_capture);
// RenderFrameObserver implementation, public for testing.
// Called by the RenderFrame when a page has started loading in the given
// WebFrame. Typically, this will cause any pending classification to be
// cancelled. However, if the navigation is within the same page, we
// continue running the current classification.
void DidCommitProvisionalLoad(bool is_new_navigation,
bool is_same_page_navigation) override;
friend class PhishingClassifierDelegateTest;
PhishingClassifierDelegate(content::RenderFrame* render_frame,
PhishingClassifier* classifier);
enum CancelClassificationReason {
CANCEL_CLASSIFICATION_MAX // Always add new values before this one.
// Cancels any pending classification and frees the page text.
void CancelPendingClassification(CancelClassificationReason reason);
// RenderFrameObserver implementation.
bool OnMessageReceived(const IPC::Message& message) override;
void OnDestruct() override;
// Called by the RenderFrame when it receives a StartPhishingDetection IPC
// from the browser. This signals that it is ok to begin classification
// for the given toplevel URL. If the URL has been fully loaded into the
// RenderFrame and a Scorer has been set, this will begin classification,
// otherwise classification will be deferred until these conditions are met.
void OnStartPhishingDetection(const GURL& url);
// Called when classification for the current page finishes.
void ClassificationDone(const ClientPhishingRequest& verdict);
// Shared code to begin classification if all conditions are met.
void MaybeStartClassification();
// The PhishingClassifier to use for the RenderFrame. This is created once
// a scorer is made available via SetPhishingScorer().
std::unique_ptr<PhishingClassifier> classifier_;
// The last URL that the browser instructed us to classify,
// with the ref stripped.
GURL last_url_received_from_browser_;
// The last top-level URL that has finished loading in the RenderFrame.
// This corresponds to the text in classifier_page_text_.
GURL last_finished_load_url_;
// The transition type for the last load in the main frame. We use this
// to exclude back/forward loads from classification. Note that this is
// set in DidCommitProvisionalLoad(); the transition is reset after this
// call in the RenderFrame, so we need to save off the value.
ui::PageTransition last_main_frame_transition_;
// The URL of the last load that we actually started classification on.
// This is used to suppress phishing classification on subframe navigation
// and back and forward navigations in history.
GURL last_url_sent_to_classifier_;
// The page text that will be analyzed by the phishing classifier. This is
// set by OnNavigate and cleared when the classifier finishes. Note that if
// there is no Scorer yet when OnNavigate is called, or the browser has not
// instructed us to classify the page, the page text will be cached until
// these conditions are met.
base::string16 classifier_page_text_;
// Tracks whether we have stored anything in classifier_page_text_ for the
// most recent load. We use this to distinguish empty text from cases where
// PageCaptured has not been called.
bool have_page_text_;
// Set to true if the classifier is currently running.
bool is_classifying_;
} // namespace safe_browsing