summaryrefslogtreecommitdiff
path: root/Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp')
-rw-r--r--Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp295
1 files changed, 295 insertions, 0 deletions
diff --git a/Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp b/Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp
new file mode 100644
index 000000000..7871acf9f
--- /dev/null
+++ b/Source/WebKit2/UIProcess/WebResourceLoadStatisticsStore.cpp
@@ -0,0 +1,295 @@
+/*
+ * Copyright (C) 2016-2017 Apple Inc. All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS''
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS
+ * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+ * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+ * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+ * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
+ * THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "config.h"
+#include "WebResourceLoadStatisticsStore.h"
+
+#include "WebProcessMessages.h"
+#include "WebProcessPool.h"
+#include "WebProcessProxy.h"
+#include "WebResourceLoadStatisticsStoreMessages.h"
+#include "WebsiteDataFetchOption.h"
+#include "WebsiteDataType.h"
+#include <WebCore/KeyedCoding.h>
+#include <WebCore/ResourceLoadObserver.h>
+#include <WebCore/ResourceLoadStatistics.h>
+#include <wtf/CurrentTime.h>
+#include <wtf/MainThread.h>
+#include <wtf/MathExtras.h>
+#include <wtf/RunLoop.h>
+#include <wtf/threads/BinarySemaphore.h>
+
+using namespace WebCore;
+
+namespace WebKit {
+
+static const auto featureVectorLengthThreshold = 3;
+static auto minimumTimeBetweeenDataRecordsRemoval = 60;
+static OptionSet<WebKit::WebsiteDataType> dataTypesToRemove;
+static auto notifyPages = false;
+static auto shouldClassifyResourcesBeforeDataRecordsRemoval = true;
+
+Ref<WebResourceLoadStatisticsStore> WebResourceLoadStatisticsStore::create(const String& resourceLoadStatisticsDirectory)
+{
+ return adoptRef(*new WebResourceLoadStatisticsStore(resourceLoadStatisticsDirectory));
+}
+
+WebResourceLoadStatisticsStore::WebResourceLoadStatisticsStore(const String& resourceLoadStatisticsDirectory)
+ : m_resourceLoadStatisticsStore(ResourceLoadStatisticsStore::create())
+ , m_statisticsQueue(WorkQueue::create("WebResourceLoadStatisticsStore Process Data Queue"))
+ , m_storagePath(resourceLoadStatisticsDirectory)
+{
+}
+
+WebResourceLoadStatisticsStore::~WebResourceLoadStatisticsStore()
+{
+}
+
+void WebResourceLoadStatisticsStore::setNotifyPagesWhenDataRecordsWereScanned(bool always)
+{
+ notifyPages = always;
+}
+
+void WebResourceLoadStatisticsStore::setShouldClassifyResourcesBeforeDataRecordsRemoval(bool value)
+{
+ shouldClassifyResourcesBeforeDataRecordsRemoval = value;
+}
+
+void WebResourceLoadStatisticsStore::setMinimumTimeBetweeenDataRecordsRemoval(double seconds)
+{
+ if (seconds >= 0)
+ minimumTimeBetweeenDataRecordsRemoval = seconds;
+}
+
+bool WebResourceLoadStatisticsStore::hasPrevalentResourceCharacteristics(const ResourceLoadStatistics& resourceStatistic)
+{
+ auto subresourceUnderTopFrameOriginsCount = resourceStatistic.subresourceUnderTopFrameOrigins.size();
+ auto subresourceUniqueRedirectsToCount = resourceStatistic.subresourceUniqueRedirectsTo.size();
+ auto subframeUnderTopFrameOriginsCount = resourceStatistic.subframeUnderTopFrameOrigins.size();
+
+ if (!subresourceUnderTopFrameOriginsCount
+ && !subresourceUniqueRedirectsToCount
+ && !subframeUnderTopFrameOriginsCount)
+ return false;
+
+ if (subresourceUnderTopFrameOriginsCount > featureVectorLengthThreshold
+ || subresourceUniqueRedirectsToCount > featureVectorLengthThreshold
+ || subframeUnderTopFrameOriginsCount > featureVectorLengthThreshold)
+ return true;
+
+ // The resource is considered prevalent if the feature vector
+ // is longer than the threshold.
+ // Vector length for n dimensions is sqrt(a^2 + (...) + n^2).
+ double vectorLength = 0;
+ vectorLength += subresourceUnderTopFrameOriginsCount * subresourceUnderTopFrameOriginsCount;
+ vectorLength += subresourceUniqueRedirectsToCount * subresourceUniqueRedirectsToCount;
+ vectorLength += subframeUnderTopFrameOriginsCount * subframeUnderTopFrameOriginsCount;
+
+ ASSERT(vectorLength > 0);
+
+ return sqrt(vectorLength) > featureVectorLengthThreshold;
+}
+
+void WebResourceLoadStatisticsStore::classifyResource(ResourceLoadStatistics& resourceStatistic)
+{
+ if (!resourceStatistic.isPrevalentResource && hasPrevalentResourceCharacteristics(resourceStatistic)) {
+ resourceStatistic.isPrevalentResource = true;
+ }
+}
+
+void WebResourceLoadStatisticsStore::removeDataRecords()
+{
+ if (m_dataRecordsRemovalPending)
+ return;
+
+ Vector<String> prevalentResourceDomains = coreStore().prevalentResourceDomainsWithoutUserInteraction();
+ if (!prevalentResourceDomains.size())
+ return;
+
+ double now = currentTime();
+ if (m_lastTimeDataRecordsWereRemoved
+ && now < m_lastTimeDataRecordsWereRemoved + minimumTimeBetweeenDataRecordsRemoval)
+ return;
+
+ m_dataRecordsRemovalPending = true;
+ m_lastTimeDataRecordsWereRemoved = now;
+
+ if (dataTypesToRemove.isEmpty()) {
+ dataTypesToRemove |= WebsiteDataType::Cookies;
+ dataTypesToRemove |= WebsiteDataType::DiskCache;
+ dataTypesToRemove |= WebsiteDataType::MemoryCache;
+ dataTypesToRemove |= WebsiteDataType::OfflineWebApplicationCache;
+ dataTypesToRemove |= WebsiteDataType::SessionStorage;
+ dataTypesToRemove |= WebsiteDataType::LocalStorage;
+ dataTypesToRemove |= WebsiteDataType::WebSQLDatabases;
+ dataTypesToRemove |= WebsiteDataType::IndexedDBDatabases;
+ dataTypesToRemove |= WebsiteDataType::MediaKeys;
+ dataTypesToRemove |= WebsiteDataType::HSTSCache;
+ dataTypesToRemove |= WebsiteDataType::SearchFieldRecentSearches;
+#if ENABLE(NETSCAPE_PLUGIN_API)
+ dataTypesToRemove |= WebsiteDataType::PlugInData;
+#endif
+#if ENABLE(MEDIA_STREAM)
+ dataTypesToRemove |= WebsiteDataType::MediaDeviceIdentifier;
+#endif
+ }
+
+ // Switch to the main thread to get the default website data store
+ RunLoop::main().dispatch([prevalentResourceDomains = WTFMove(prevalentResourceDomains), this] () mutable {
+ WebProcessProxy::deleteWebsiteDataForTopPrivatelyOwnedDomainsInAllPersistentDataStores(dataTypesToRemove, prevalentResourceDomains, notifyPages, [this]() mutable {
+ m_dataRecordsRemovalPending = false;
+ });
+ });
+}
+
+void WebResourceLoadStatisticsStore::processStatisticsAndDataRecords()
+{
+ if (shouldClassifyResourcesBeforeDataRecordsRemoval) {
+ coreStore().processStatistics([this] (ResourceLoadStatistics& resourceStatistic) {
+ classifyResource(resourceStatistic);
+ });
+ }
+ removeDataRecords();
+
+ auto encoder = coreStore().createEncoderFromData();
+
+ writeEncoderToDisk(*encoder.get(), "full_browsing_session");
+}
+
+void WebResourceLoadStatisticsStore::resourceLoadStatisticsUpdated(const Vector<WebCore::ResourceLoadStatistics>& origins)
+{
+ coreStore().mergeStatistics(origins);
+ processStatisticsAndDataRecords();
+}
+
+void WebResourceLoadStatisticsStore::setResourceLoadStatisticsEnabled(bool enabled)
+{
+ if (enabled == m_resourceLoadStatisticsEnabled)
+ return;
+
+ m_resourceLoadStatisticsEnabled = enabled;
+
+ readDataFromDiskIfNeeded();
+}
+
+bool WebResourceLoadStatisticsStore::resourceLoadStatisticsEnabled() const
+{
+ return m_resourceLoadStatisticsEnabled;
+}
+
+
+void WebResourceLoadStatisticsStore::registerSharedResourceLoadObserver()
+{
+ ResourceLoadObserver::sharedObserver().setStatisticsStore(m_resourceLoadStatisticsStore.copyRef());
+ m_resourceLoadStatisticsStore->setNotificationCallback([this] {
+ if (m_resourceLoadStatisticsStore->isEmpty())
+ return;
+ processStatisticsAndDataRecords();
+ });
+}
+
+void WebResourceLoadStatisticsStore::readDataFromDiskIfNeeded()
+{
+ if (!m_resourceLoadStatisticsEnabled)
+ return;
+
+ m_statisticsQueue->dispatch([this, protectedThis = makeRef(*this)] {
+ coreStore().clear();
+
+ auto decoder = createDecoderFromDisk("full_browsing_session");
+ if (!decoder)
+ return;
+
+ coreStore().readDataFromDecoder(*decoder);
+ });
+}
+
+void WebResourceLoadStatisticsStore::processWillOpenConnection(WebProcessProxy&, IPC::Connection& connection)
+{
+ connection.addWorkQueueMessageReceiver(Messages::WebResourceLoadStatisticsStore::messageReceiverName(), m_statisticsQueue.get(), this);
+}
+
+void WebResourceLoadStatisticsStore::processDidCloseConnection(WebProcessProxy&, IPC::Connection& connection)
+{
+ connection.removeWorkQueueMessageReceiver(Messages::WebResourceLoadStatisticsStore::messageReceiverName());
+}
+
+void WebResourceLoadStatisticsStore::applicationWillTerminate()
+{
+ BinarySemaphore semaphore;
+ m_statisticsQueue->dispatch([this, &semaphore] {
+ // Make sure any ongoing work in our queue is finished before we terminate.
+ semaphore.signal();
+ });
+ semaphore.wait(WallTime::infinity());
+}
+
+String WebResourceLoadStatisticsStore::persistentStoragePath(const String& label) const
+{
+ if (m_storagePath.isEmpty())
+ return emptyString();
+
+ // TODO Decide what to call this file
+ return pathByAppendingComponent(m_storagePath, label + "_resourceLog.plist");
+}
+
+void WebResourceLoadStatisticsStore::writeEncoderToDisk(KeyedEncoder& encoder, const String& label) const
+{
+ RefPtr<SharedBuffer> rawData = encoder.finishEncoding();
+ if (!rawData)
+ return;
+
+ String resourceLog = persistentStoragePath(label);
+ if (resourceLog.isEmpty())
+ return;
+
+ if (!m_storagePath.isEmpty())
+ makeAllDirectories(m_storagePath);
+
+ auto handle = openFile(resourceLog, OpenForWrite);
+ if (!handle)
+ return;
+
+ int64_t writtenBytes = writeToFile(handle, rawData->data(), rawData->size());
+ closeFile(handle);
+
+ if (writtenBytes != static_cast<int64_t>(rawData->size()))
+ WTFLogAlways("WebResourceLoadStatisticsStore: We only wrote %d out of %d bytes to disk", static_cast<unsigned>(writtenBytes), rawData->size());
+}
+
+std::unique_ptr<KeyedDecoder> WebResourceLoadStatisticsStore::createDecoderFromDisk(const String& label) const
+{
+ String resourceLog = persistentStoragePath(label);
+ if (resourceLog.isEmpty())
+ return nullptr;
+
+ RefPtr<SharedBuffer> rawData = SharedBuffer::createWithContentsOfFile(resourceLog);
+ if (!rawData)
+ return nullptr;
+
+ return KeyedDecoder::decoder(reinterpret_cast<const uint8_t*>(rawData->data()), rawData->size());
+}
+
+} // namespace WebKit