From 7a6dae70ee43cd8fdacf227c9385442b53992d2f Mon Sep 17 00:00:00 2001 From: Jacob Sikorski Date: Mon, 30 Oct 2023 13:27:13 -0600 Subject: [PATCH] [Uplift] Impose the max engines limitation on content blockers (uplift to 1.58.1) (#8336) * Fix #8292: Change the minimum number of engines available (#8288) * Fix #8294: Compile only the needed content blockers eagerly (#8295) Compile max content blockers --- .../Browser/Helpers/LaunchHelper.swift | 3 +- .../AdblockResourceDownloader.swift | 27 ++--- .../ContentBlockerManager.swift | 23 +++- .../FilterListCustomURLDownloader.swift | 41 +++---- .../FilterListResourceDownloader.swift | 80 ++++--------- .../ShieldStats/Adblock/AdBlockStats.swift | 110 ++++++++++++------ .../ContentBlockerManagerTests.swift | 6 +- 7 files changed, 149 insertions(+), 141 deletions(-) diff --git a/Sources/Brave/Frontend/Browser/Helpers/LaunchHelper.swift b/Sources/Brave/Frontend/Browser/Helpers/LaunchHelper.swift index a8a843ca664..1e9985d0600 100644 --- a/Sources/Brave/Frontend/Browser/Helpers/LaunchHelper.swift +++ b/Sources/Brave/Frontend/Browser/Helpers/LaunchHelper.swift @@ -88,7 +88,8 @@ public actor LaunchHelper { Task.detached(priority: .low) { // Let's disable filter lists if we have reached a maxumum amount - let enabledSources = await AdBlockStats.shared.enabledSources + let enabledSources = await AdBlockStats.shared.enabledPrioritizedSources + if enabledSources.count > AdBlockStats.maxNumberOfAllowedFilterLists { let toDisableSources = enabledSources[AdBlockStats.maxNumberOfAllowedFilterLists...] diff --git a/Sources/Brave/WebFilters/AdblockResourceDownloader.swift b/Sources/Brave/WebFilters/AdblockResourceDownloader.swift index 561c7045f99..3bc7ccc5a8c 100644 --- a/Sources/Brave/WebFilters/AdblockResourceDownloader.swift +++ b/Sources/Brave/WebFilters/AdblockResourceDownloader.swift @@ -122,35 +122,26 @@ public actor AdblockResourceDownloader: Sendable { switch resource { case .adBlockRules: let blocklistType = ContentBlockerManager.BlocklistType.generic(.blockAds) - let modes = await blocklistType.allowedModes.asyncFilter { mode in - guard allowedModes.contains(mode) else { return false } - if downloadResult.isModified { return true } - - // If the file wasn't modified, make sure we have something compiled. - // We should, but this can be false during upgrades if the identifier changed for some reason. - if await ContentBlockerManager.shared.hasRuleList(for: blocklistType, mode: mode) { - ContentBlockerManager.log.debug("Rule list already compiled for `\(blocklistType.makeIdentifier(for: mode))`") - return false - } else { - return true - } + var modes = blocklistType.allowedModes + + if !downloadResult.isModified && !allowedModes.isEmpty { + // If the download is not modified, only compile the missing modes for performance reasons + let missingModes = await ContentBlockerManager.shared.missingModes(for: blocklistType) + modes = missingModes.filter({ allowedModes.contains($0) }) } // No modes are needed to be compiled guard !modes.isEmpty else { return } do { - guard let filterSet = try resource.downloadedString() else { + guard let fileURL = resource.downloadedFileURL else { assertionFailure("This file was downloaded successfully so it should not be nil") return } - let result = try AdblockEngine.contentBlockerRules(fromFilterSet: filterSet) - // try to compile - try await ContentBlockerManager.shared.compile( - encodedContentRuleList: result.rulesJSON, for: blocklistType, - modes: modes + try await ContentBlockerManager.shared.compileRuleList( + at: fileURL, for: blocklistType, modes: modes ) } catch { ContentBlockerManager.log.error( diff --git a/Sources/Brave/WebFilters/ContentBlocker/ContentBlockerManager.swift b/Sources/Brave/WebFilters/ContentBlocker/ContentBlockerManager.swift index dbd02a78367..3891637901e 100644 --- a/Sources/Brave/WebFilters/ContentBlocker/ContentBlockerManager.swift +++ b/Sources/Brave/WebFilters/ContentBlocker/ContentBlockerManager.swift @@ -9,6 +9,7 @@ import Data import Shared import Preferences import BraveShields +import BraveCore import os.log /// A class that aids in the managment of rule lists on the rule store. @@ -165,9 +166,11 @@ actor ContentBlockerManager { } } - /// Compile the given resource and store it in cache for the given blocklist type using all allowed modes - func compile(encodedContentRuleList: String, for type: BlocklistType, options: CompileOptions = []) async throws { - try await self.compile(encodedContentRuleList: encodedContentRuleList, for: type, modes: type.allowedModes) + /// Compile the rule list found in the given local URL using the specified modes + func compileRuleList(at localFileURL: URL, for type: BlocklistType, options: CompileOptions = [], modes: [BlockingMode]) async throws { + let filterSet = try String(contentsOf: localFileURL) + let result = try AdblockEngine.contentBlockerRules(fromFilterSet: filterSet) + try await compile(encodedContentRuleList: result.rulesJSON, for: type, options: options, modes: modes) } /// Compile the given resource and store it in cache for the given blocklist type and specified modes @@ -253,6 +256,20 @@ actor ContentBlockerManager { return ruleList } + /// Return all the modes that need to be compiled for the given type + func missingModes(for type: BlocklistType) async -> [BlockingMode] { + return await type.allowedModes.asyncFilter { mode in + // If the file wasn't modified, make sure we have something compiled. + // We should, but this can be false during upgrades if the identifier changed for some reason. + if await hasRuleList(for: type, mode: mode) { + ContentBlockerManager.log.debug("Rule list already compiled for `\(type.makeIdentifier(for: mode))`") + return false + } else { + return true + } + } + } + /// Check if a rule list is compiled for this type func hasRuleList(for type: BlocklistType, mode: BlockingMode) async -> Bool { do { diff --git a/Sources/Brave/WebFilters/FilterListCustomURLDownloader.swift b/Sources/Brave/WebFilters/FilterListCustomURLDownloader.swift index 89d3c66124b..30098586b29 100644 --- a/Sources/Brave/WebFilters/FilterListCustomURLDownloader.swift +++ b/Sources/Brave/WebFilters/FilterListCustomURLDownloader.swift @@ -87,54 +87,43 @@ actor FilterListCustomURLDownloader: ObservableObject { /// Handle the download results of a custom filter list. This will process the download by compiling iOS rule lists and adding the rule list to the `AdblockEngineManager`. private func handle(downloadResult: ResourceDownloader.DownloadResult, for filterListCustomURL: FilterListCustomURL) async { let uuid = await filterListCustomURL.setting.uuid - - // Compile this rule list if we haven't already or if the file has been modified - if downloadResult.isModified { - do { - let filterSet = try String(contentsOf: downloadResult.fileURL, encoding: .utf8) - let result = try AdblockEngine.contentBlockerRules(fromFilterSet: filterSet) - let type = ContentBlockerManager.BlocklistType.customFilterList(uuid: uuid) - - try await ContentBlockerManager.shared.compile( - encodedContentRuleList: result.rulesJSON, - for: type, - options: .all - ) - - ContentBlockerManager.log.debug( - "Loaded custom filter list content blockers: \(String(describing: type))" - ) - } catch { - ContentBlockerManager.log.error( - "Failed to convert custom filter list to content blockers: \(error.localizedDescription)" - ) - } - } // Add/remove the resource depending on if it is enabled/disabled - let source = CachedAdBlockEngine.Source.filterListURL(uuid: uuid) guard let resourcesInfo = await FilterListResourceDownloader.shared.resourcesInfo else { assertionFailure("This should not have been called if the resources are not ready") return } + let source = await filterListCustomURL.setting.engineSource let version = fileVersionDateFormatter.string(from: downloadResult.date) let filterListInfo = CachedAdBlockEngine.FilterListInfo( source: .filterListURL(uuid: uuid), localFileURL: downloadResult.fileURL, version: version, fileType: .text ) + let lazyInfo = AdBlockStats.LazyFilterListInfo( + filterListInfo: filterListInfo, isAlwaysAggressive: true + ) guard await AdBlockStats.shared.isEagerlyLoaded(source: source) else { // Don't compile unless eager await AdBlockStats.shared.updateIfNeeded(resourcesInfo: resourcesInfo) await AdBlockStats.shared.updateIfNeeded(filterListInfo: filterListInfo, isAlwaysAggressive: true) + + // To free some space, remove any rule lists that are not needed + if let blocklistType = lazyInfo.blocklistType { + do { + try await ContentBlockerManager.shared.removeRuleLists(for: blocklistType) + } catch { + ContentBlockerManager.log.error("Failed to remove rule lists for \(filterListInfo.debugDescription)") + } + } return } await AdBlockStats.shared.compile( - filterListInfo: filterListInfo, resourcesInfo: resourcesInfo, - isAlwaysAggressive: true + lazyInfo: lazyInfo, resourcesInfo: resourcesInfo, + compileContentBlockers: downloadResult.isModified ) } diff --git a/Sources/Brave/WebFilters/FilterListResourceDownloader.swift b/Sources/Brave/WebFilters/FilterListResourceDownloader.swift index 24ac659f5f6..1228745addf 100644 --- a/Sources/Brave/WebFilters/FilterListResourceDownloader.swift +++ b/Sources/Brave/WebFilters/FilterListResourceDownloader.swift @@ -86,7 +86,8 @@ public actor FilterListResourceDownloader { await self.compileFilterListEngineIfNeeded( fromComponentId: componentId, folderURL: folderURL, isAlwaysAggressive: setting.isAlwaysAggressive, - resourcesInfo: resourcesInfo + resourcesInfo: resourcesInfo, + compileContentBlockers: false ) // Sleep for 1ms. This drastically reduces memory usage without much impact to usability @@ -157,14 +158,13 @@ public actor FilterListResourceDownloader { localFileURL: folderURL.appendingPathComponent("rs-ABPFilterParserData.dat", conformingTo: .data), version: version, fileType: .dat ) - - guard await AdBlockStats.shared.needsCompilation(for: filterListInfo, resourcesInfo: resourcesInfo) else { - return - } + let lazyInfo = AdBlockStats.LazyFilterListInfo( + filterListInfo: filterListInfo, isAlwaysAggressive: false + ) await AdBlockStats.shared.compile( - filterListInfo: filterListInfo, resourcesInfo: resourcesInfo, - isAlwaysAggressive: false + lazyInfo: lazyInfo, resourcesInfo: resourcesInfo, + compileContentBlockers: false ) } @@ -172,7 +172,8 @@ public actor FilterListResourceDownloader { private func compileFilterListEngineIfNeeded( fromComponentId componentId: String, folderURL: URL, isAlwaysAggressive: Bool, - resourcesInfo: CachedAdBlockEngine.ResourcesInfo + resourcesInfo: CachedAdBlockEngine.ResourcesInfo, + compileContentBlockers: Bool ) async { let version = folderURL.lastPathComponent let source = CachedAdBlockEngine.Source.filterList(componentId: componentId) @@ -181,22 +182,26 @@ public actor FilterListResourceDownloader { localFileURL: folderURL.appendingPathComponent("list.txt", conformingTo: .text), version: version, fileType: .text ) - + let lazyInfo = AdBlockStats.LazyFilterListInfo(filterListInfo: filterListInfo, isAlwaysAggressive: isAlwaysAggressive) guard await AdBlockStats.shared.isEagerlyLoaded(source: source) else { // Don't compile unless eager await AdBlockStats.shared.updateIfNeeded(resourcesInfo: resourcesInfo) await AdBlockStats.shared.updateIfNeeded(filterListInfo: filterListInfo, isAlwaysAggressive: isAlwaysAggressive) - return - } - - guard await AdBlockStats.shared.needsCompilation(for: filterListInfo, resourcesInfo: resourcesInfo) else { - // Don't compile unless needed + + // To free some space, remove any rule lists that are not needed + if let blocklistType = lazyInfo.blocklistType { + do { + try await ContentBlockerManager.shared.removeRuleLists(for: blocklistType) + } catch { + ContentBlockerManager.log.error("Failed to remove rule lists for \(filterListInfo.debugDescription)") + } + } return } await AdBlockStats.shared.compile( - filterListInfo: filterListInfo, resourcesInfo: resourcesInfo, - isAlwaysAggressive: isAlwaysAggressive + lazyInfo: lazyInfo, resourcesInfo: resourcesInfo, + compileContentBlockers: compileContentBlockers ) } @@ -258,49 +263,8 @@ public actor FilterListResourceDownloader { // Add or remove the filter list from the engine depending if it's been enabled or not await self.compileFilterListEngineIfNeeded( fromComponentId: componentId, folderURL: folderURL, isAlwaysAggressive: isAlwaysAggressive, - resourcesInfo: resourcesInfo + resourcesInfo: resourcesInfo, compileContentBlockers: loadContentBlockers ) - - // Compile this rule list if we haven't already or if the file has been modified - // We also don't load them if they are loading from cache because this will cost too much during launch - if loadContentBlockers { - let version = folderURL.lastPathComponent - let blocklistType = ContentBlockerManager.BlocklistType.filterList(componentId: componentId, isAlwaysAggressive: isAlwaysAggressive) - let modes = await blocklistType.allowedModes.asyncFilter { mode in - if let loadedVersion = await FilterListStorage.shared.loadedRuleListVersions.value[componentId] { - // if we know the loaded version we can just check it (optimization) - return loadedVersion != version - } else { - return true - } - } - - // No modes need to be compiled - guard !modes.isEmpty else { return } - - do { - let filterSet = try String(contentsOf: filterListURL, encoding: .utf8) - let result = try AdblockEngine.contentBlockerRules(fromFilterSet: filterSet) - - try await ContentBlockerManager.shared.compile( - encodedContentRuleList: result.rulesJSON, for: blocklistType, - options: .all, modes: modes - ) - - await MainActor.run { - FilterListStorage.shared.loadedRuleListVersions.value[componentId] = version - } - } catch { - ContentBlockerManager.log.error( - "Failed to create content blockers for `\(componentId)` v\(version): \(error)" - ) - #if DEBUG - ContentBlockerManager.log.debug( - "`\(componentId)`: \(filterListURL.absoluteString)" - ) - #endif - } - } } } diff --git a/Sources/Brave/WebFilters/ShieldStats/Adblock/AdBlockStats.swift b/Sources/Brave/WebFilters/ShieldStats/Adblock/AdBlockStats.swift index 1952e851e1b..58c52f962e3 100644 --- a/Sources/Brave/WebFilters/ShieldStats/Adblock/AdBlockStats.swift +++ b/Sources/Brave/WebFilters/ShieldStats/Adblock/AdBlockStats.swift @@ -13,16 +13,19 @@ import os.log public actor AdBlockStats { /// The max number of enabled filter lists depending on the amount memory available to the device static var maxNumberOfAllowedFilterLists: Int = { - let memory = Int(ProcessInfo.processInfo.physicalMemory / 1073741824) - ContentBlockerManager.log.debug("Memory: \(memory)") - return min(5 * memory, 40) + // Get the number of gigs (memory in bytes divided by the size of a gig in bytes) + let numberOfGigs = Int(ProcessInfo.processInfo.physicalMemory / 1073741824) + ContentBlockerManager.log.debug("Number of gigs (rounded down): \(numberOfGigs)") + // Take a value between 20 and 40, + // with the real value somewhere in the middle depending on the device's memory + return max(min(5 * numberOfGigs, 40), 20) }() typealias CosmeticFilterModelTuple = (isAlwaysAggressive: Bool, model: CosmeticFilterModel) public static let shared = AdBlockStats() /// An object containing the basic information to allow us to compile an engine - struct LazyFilterListInfo { + public struct LazyFilterListInfo { let filterListInfo: CachedAdBlockEngine.FilterListInfo let isAlwaysAggressive: Bool } @@ -53,6 +56,16 @@ public actor AdBlockStats { return enabledSources } + @MainActor var enabledPrioritizedSources: [CachedAdBlockEngine.Source] { + let criticalSources = Set(self.criticalSources) + var enabledSources: [CachedAdBlockEngine.Source] = [.adBlock] + enabledSources.append(contentsOf: FilterListStorage.shared.enabledSources.sorted { left, right in + return criticalSources.contains(left) && !criticalSources.contains(right) + }) + enabledSources.append(contentsOf: CustomFilterListStorage.shared.enabledSources) + return enabledSources + } + /// Tells us if we reached the max limit of already compiled filter lists var reachedMaxLimit: Bool { return cachedEngines.count >= Self.maxNumberOfAllowedFilterLists @@ -74,30 +87,42 @@ public actor AdBlockStats { /// /// - Note: This method will ensure syncronous compilation public func compile( - filterListInfo: CachedAdBlockEngine.FilterListInfo, resourcesInfo: CachedAdBlockEngine.ResourcesInfo, - isAlwaysAggressive: Bool, ignoreMaximum: Bool = false + lazyInfo: LazyFilterListInfo, resourcesInfo: CachedAdBlockEngine.ResourcesInfo, + ignoreMaximum: Bool = false, compileContentBlockers: Bool ) async { await currentCompileTask?.value - guard needsCompilation(for: filterListInfo, resourcesInfo: resourcesInfo) else { - // Ensure we only compile if we need to. This prevents two lazy loads from recompiling - return - } - currentCompileTask = Task { - if !ignoreMaximum && reachedMaxLimit && cachedEngines[filterListInfo.source] == nil { - ContentBlockerManager.log.error("Failed to compile engine for \(filterListInfo.source.debugDescription): Reached maximum!") + if !ignoreMaximum && reachedMaxLimit && cachedEngines[lazyInfo.filterListInfo.source] == nil { + ContentBlockerManager.log.error("Failed to compile engine for \(lazyInfo.filterListInfo.source.debugDescription): Reached maximum!") return } - do { - let engine = try CachedAdBlockEngine.compile( - filterListInfo: filterListInfo, resourcesInfo: resourcesInfo, isAlwaysAggressive: isAlwaysAggressive - ) + // Compile engine + if needsCompilation(for: lazyInfo.filterListInfo, resourcesInfo: resourcesInfo) { + do { + let engine = try CachedAdBlockEngine.compile( + filterListInfo: lazyInfo.filterListInfo, resourcesInfo: resourcesInfo, isAlwaysAggressive: lazyInfo.isAlwaysAggressive + ) + + add(engine: engine) + } catch { + ContentBlockerManager.log.error("Failed to compile engine for \(lazyInfo.filterListInfo.source.debugDescription)") + } + } + + // Compile content blockers + if compileContentBlockers, let blocklistType = lazyInfo.blocklistType { + let modes = await ContentBlockerManager.shared.missingModes(for: blocklistType) + guard !modes.isEmpty else { return } - add(engine: engine) - } catch { - ContentBlockerManager.log.error("Failed to compile engine for \(filterListInfo.source.debugDescription)") + do { + try await ContentBlockerManager.shared.compileRuleList( + at: lazyInfo.filterListInfo.localFileURL, for: blocklistType, modes: modes + ) + } catch { + ContentBlockerManager.log.error("Failed to compile rule list for \(lazyInfo.filterListInfo.source.debugDescription)") + } } } @@ -130,15 +155,6 @@ public actor AdBlockStats { self.resourcesInfo = resourcesInfo } - /// Remove an engine for the given source. - func removeEngine(for source: CachedAdBlockEngine.Source) { - if let filterListInfo = cachedEngines[source]?.filterListInfo { - ContentBlockerManager.log.debug("Removed engine for \(filterListInfo.debugDescription)") - } - - cachedEngines.removeValue(forKey: source) - } - /// Remove all the engines func removeAllEngines() { cachedEngines.removeAll() @@ -150,22 +166,35 @@ public actor AdBlockStats { for source in cachedEngines.keys { guard !sources.contains(source) else { continue } - removeEngine(for: source) + // Remove the engine + if let filterListInfo = cachedEngines[source]?.filterListInfo { + cachedEngines.removeValue(forKey: source) + ContentBlockerManager.log.debug("Removed engine for \(filterListInfo.debugDescription)") + } + + // Delete the Content blockers + if let lazyInfo = availableFilterLists[source], let blocklistType = lazyInfo.blocklistType { + do { + try await ContentBlockerManager.shared.removeRuleLists(for: blocklistType) + } catch { + ContentBlockerManager.log.error("Failed to remove rule lists for \(lazyInfo.filterListInfo.debugDescription)") + } + } } } /// Remove all engines that have disabled sources func ensureEnabledEngines() async { do { - for source in await enabledSources { + for source in await enabledPrioritizedSources { guard cachedEngines[source] == nil else { continue } guard let availableFilterList = availableFilterLists[source] else { continue } guard let resourcesInfo = self.resourcesInfo else { continue } await compile( - filterListInfo: availableFilterList.filterListInfo, + lazyInfo: availableFilterList, resourcesInfo: resourcesInfo, - isAlwaysAggressive: availableFilterList.isAlwaysAggressive + compileContentBlockers: true ) // Sleep for 1ms. This drastically reduces memory usage without much impact to usability @@ -335,3 +364,18 @@ private extension CachedAdBlockEngine.Source { } } } + +extension AdBlockStats.LazyFilterListInfo { + var blocklistType: ContentBlockerManager.BlocklistType? { + switch filterListInfo.source { + case .adBlock: + // Normally this should be .generic(.blockAds) + // but this content blocker is coming from slim-list + return nil + case .filterList(let componentId): + return .filterList(componentId: componentId, isAlwaysAggressive: isAlwaysAggressive) + case .filterListURL(let uuid): + return .customFilterList(uuid: uuid) + } + } +} diff --git a/Tests/ClientTests/ContentBlockerManagerTests.swift b/Tests/ClientTests/ContentBlockerManagerTests.swift index ec31086b84e..f27a2b95d9a 100644 --- a/Tests/ClientTests/ContentBlockerManagerTests.swift +++ b/Tests/ClientTests/ContentBlockerManagerTests.swift @@ -35,8 +35,10 @@ class ContentBlockerManagerTests: XCTestCase { } do { - try await manager.compile(encodedContentRuleList: encodedContentRuleList, for: .filterList(componentId: filterListUUID, isAlwaysAggressive: false)) - try await manager.compile(encodedContentRuleList: encodedContentRuleList, for: .customFilterList(uuid: filterListCustomUUID)) + let filterListType = ContentBlockerManager.BlocklistType.filterList(componentId: filterListUUID, isAlwaysAggressive: false) + try await manager.compile(encodedContentRuleList: encodedContentRuleList, for: filterListType, modes: filterListType.allowedModes) + let customListType = ContentBlockerManager.BlocklistType.customFilterList(uuid: filterListCustomUUID) + try await manager.compile(encodedContentRuleList: encodedContentRuleList, for: customListType, modes: customListType.allowedModes) } catch { XCTFail(error.localizedDescription) }