// Copyright 2011 The Chromium Authors // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. // // PhishingTermFeatureExtractor handles computing term features from the text // of a web page for the client-side phishing detection model. To do this, it // takes a list of terms that appear in the model, and scans through the page // text looking for them. Any terms that appear will cause a corresponding // features::kPageTerm feature to be added to the FeatureMap. // // To make it harder for a phisher to enumerate all of the relevant terms in // the model, the terms are provided as SHA-256 hashes, rather than plain text. // // There is one PhishingTermFeatureExtractor per RenderView. #ifndef COMPONENTS_SAFE_BROWSING_CONTENT_RENDERER_PHISHING_CLASSIFIER_PHISHING_TERM_FEATURE_EXTRACTOR_H_ #define COMPONENTS_SAFE_BROWSING_CONTENT_RENDERER_PHISHING_CLASSIFIER_PHISHING_TERM_FEATURE_EXTRACTOR_H_ #include <stddef.h> #include <stdint.h> #include <memory> #include <set> #include <string> #include <string_view> #include <unordered_set> #include "base/functional/callback.h" #include "base/memory/raw_ptr.h" #include "base/memory/weak_ptr.h" #include "base/time/tick_clock.h" namespace safe_browsing { class FeatureMap; class PhishingTermFeatureExtractor { … }; } // namespace safe_browsing #endif // COMPONENTS_SAFE_BROWSING_CONTENT_RENDERER_PHISHING_CLASSIFIER_PHISHING_TERM_FEATURE_EXTRACTOR_H_