// Copyright 2022 The Chromium Authors // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef COMPONENTS_BROWSING_TOPICS_EPOCH_TOPICS_H_ #define COMPONENTS_BROWSING_TOPICS_EPOCH_TOPICS_H_ #include "base/time/time.h" #include "base/values.h" #include "components/browsing_topics/topic_and_domains.h" #include "components/browsing_topics/util.h" #include "url/origin.h" namespace browsing_topics { // Contains the epoch's top topics. This is the necessary data to calculate the // browsing topic for one epoch when a context requests it via // document.browsingTopics(). class EpochTopics { public: explicit EpochTopics(base::Time calculation_time); EpochTopics(std::vector top_topics_and_observing_domains, size_t padded_top_topics_start_index, size_t taxonomy_size, int taxonomy_version, int64_t model_version, base::Time calculation_time); EpochTopics(const EpochTopics&) = delete; EpochTopics& operator=(const EpochTopics&) = delete; EpochTopics(EpochTopics&&); EpochTopics& operator=(EpochTopics&&); ~EpochTopics(); // Serialization functions for storing in prefs. static EpochTopics FromDictValue(const base::Value::Dict& dict_value); base::Value::Dict ToDictValue() const; // Calculate the topic to expose on `top_domain` when requested by a context // where the domain hash is `hashed_context_domain`. `output_is_true_topic` // will indicate whether the returned topic (if any) is a true top topic. // `candidate_topic_filtered` will indicate whether the empty result is due to // the candicate topic is filtered. Return absl::nullopt when there are no // topics (i.e. calculation failed, or the topics were cleared), or when the // candidate topic is filtered due to the context has not observed the topic // before. The `hmac_key` is the one used to hash the domains inside // `top_topics_and_observing_domains_` and `hashed_context_domain`. absl::optional TopicForSite(const std::string& top_domain, const HashedDomain& hashed_context_domain, ReadOnlyHmacKey hmac_key, bool& output_is_true_topic, bool& candidate_topic_filtered) const; // Similar to `TopicForSite`, but this does not apply the filtering based on a // calling context, and only returns a topic if the candidate topic is a true // top topic (as opposed to the random topic, or the randomly padded top // topic). This method is used for displaying the candidate topics for a site // for the UX. absl::optional TopicForSiteForDisplay(const std::string& top_domain, ReadOnlyHmacKey hmac_key) const; // Whether `top_topics_and_observing_domains_` is empty. bool empty() const { return top_topics_and_observing_domains_.empty(); } // Clear `top_topics_and_observing_domains_` and // reset `padded_top_topics_start_index_` to 0. void ClearTopics(); // Clear an entry in `top_topics_and_observing_domains_` that matches `topic`. void ClearTopic(Topic topic); // Clear the domains in `top_topics_and_observing_domains_` that match // `hashed_context_domain`. void ClearContextDomain(const HashedDomain& hashed_context_domain); const std::vector& top_topics_and_observing_domains() const { return top_topics_and_observing_domains_; } size_t padded_top_topics_start_index() const { return padded_top_topics_start_index_; } size_t taxonomy_size() const { return taxonomy_size_; } int taxonomy_version() const { return taxonomy_version_; } int64_t model_version() const { return model_version_; } base::Time calculation_time() const { return calculation_time_; } private: absl::optional TopicForSiteHelper( const std::string& top_domain, bool need_filtering, bool allow_random_or_padded_topic, const HashedDomain& hashed_context_domain, ReadOnlyHmacKey hmac_key, bool& output_is_true_topic, bool& candidate_topic_filtered) const; // The top topics for this epoch, and the context domains that observed each // topic across // `kBrowsingTopicsNumberOfEpochsOfObservationDataToUseForFiltering` epochs. // Its length should be either equal to the configuration parameter // `kBrowsingTopicsNumberOfTopTopicsPerEpoch`, or 0, which may be due to not // enough history entries, permission denial for calculating, or history // deletion. std::vector top_topics_and_observing_domains_; // Some topics in `top_topics_and_observing_domains_` may be randomly padded // at the end. `padded_top_topics_start_index_` is the starting index of // those randomly padded topics. If all topics in // `top_topics_and_observing_domains_` are real, then // `padded_top_topics_start_index_` will equal // `top_topics_and_observing_domains_.size()`. size_t padded_top_topics_start_index_ = 0; // The size of the taxonomy applicable to this epoch's topics. size_t taxonomy_size_ = 0; // The version of the taxonomy applicable to this epoch's topics. int taxonomy_version_ = 0; // The version of the model used to calculate this epoch's topics. int64_t model_version_ = 0; // The calculation start time. This determines the end time of this epoch's // underlying topics data, and may determine the start time of future epochs' // underlying topics data. It's only best effort to read this field from a // failed calculation, as historically this field is only set for successful // calculations. base::Time calculation_time_; }; } // namespace browsing_topics #endif // COMPONENTS_BROWSING_TOPICS_EPOCH_TOPICS_H_