diff --git a/app/src/main/kotlin/com/svenjacobs/app/leon/startup/ContainerInitializer.kt b/app/src/main/kotlin/com/svenjacobs/app/leon/startup/ContainerInitializer.kt index 8252c811..d5d85cc2 100644 --- a/app/src/main/kotlin/com/svenjacobs/app/leon/startup/ContainerInitializer.kt +++ b/app/src/main/kotlin/com/svenjacobs/app/leon/startup/ContainerInitializer.kt @@ -58,6 +58,7 @@ import com.svenjacobs.app.leon.core.domain.sanitizer.theguardian.TheGuardianSani import com.svenjacobs.app.leon.core.domain.sanitizer.threads.ThreadsSanitizer import com.svenjacobs.app.leon.core.domain.sanitizer.tiktok.TiktokSanitizer import com.svenjacobs.app.leon.core.domain.sanitizer.webtrekk.WebtrekkSanitizer +import com.svenjacobs.app.leon.core.domain.sanitizer.wikipedia.WikipediaSanitizer import com.svenjacobs.app.leon.core.domain.sanitizer.x.XSanitizer import com.svenjacobs.app.leon.core.domain.sanitizer.yahoo.YahooSearchSanitizer import com.svenjacobs.app.leon.core.domain.sanitizer.yandex.YandexSanitizer @@ -113,6 +114,7 @@ class ContainerInitializer : DistinctInitializer { ThreadsSanitizer(), TiktokSanitizer(), WebtrekkSanitizer(), + WikipediaSanitizer(), XSanitizer(), YahooSearchSanitizer(), YandexSanitizer(), diff --git a/core-domain/src/main/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizer.kt b/core-domain/src/main/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizer.kt new file mode 100644 index 00000000..80d49822 --- /dev/null +++ b/core-domain/src/main/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizer.kt @@ -0,0 +1,43 @@ +/* + * Léon - The URL Cleaner + * Copyright (C) 2023 Sven Jacobs + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see . + */ + +package com.svenjacobs.app.leon.core.domain.sanitizer.wikipedia + +import android.content.Context +import com.svenjacobs.app.leon.core.common.domain.matchesDomainRegex +import com.svenjacobs.app.leon.core.common.regex.RegexFactory +import com.svenjacobs.app.leon.core.domain.R +import com.svenjacobs.app.leon.core.domain.sanitizer.RegexSanitizer +import com.svenjacobs.app.leon.core.domain.sanitizer.Sanitizer +import com.svenjacobs.app.leon.core.domain.sanitizer.SanitizerId + +class WikipediaSanitizer : + RegexSanitizer( + regex = RegexFactory.ofParameter("wprov"), + ) { + + override val id = SanitizerId("wikipedia") + + override fun getMetadata(context: Context) = Sanitizer.Metadata( + name = context.getString(R.string.sanitizer_wikipedia_name), + ) + + override fun matchesDomain(input: String) = input.matchesDomainRegex( + domain = "(.*\\.)?wikipedia.org", + ) +} diff --git a/core-domain/src/main/res/values/strings.xml b/core-domain/src/main/res/values/strings.xml index 8f2dd20c..3ac4a738 100644 --- a/core-domain/src/main/res/values/strings.xml +++ b/core-domain/src/main/res/values/strings.xml @@ -55,6 +55,7 @@ Threads.net TikTok Webtrekk + Wikipedia X (Twitter) Yahoo Search Yandex diff --git a/core-domain/src/test/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizerTest.kt b/core-domain/src/test/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizerTest.kt new file mode 100644 index 00000000..36e60f97 --- /dev/null +++ b/core-domain/src/test/kotlin/com/svenjacobs/app/leon/core/domain/sanitizer/wikipedia/WikipediaSanitizerTest.kt @@ -0,0 +1,56 @@ +/* + * Léon - The URL Cleaner + * Copyright (C) 2023 Sven Jacobs + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation, either version 3 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see . + */ + +package com.svenjacobs.app.leon.core.domain.sanitizer.wikipedia + +import io.kotest.core.spec.style.WordSpec +import io.kotest.matchers.shouldBe + +class WikipediaSanitizerTest : + WordSpec( + { + val sanitizer = WikipediaSanitizer() + + "invoke" should { + + "clean en.wikipedia.org URLs" { + sanitizer("https://en.wikipedia.org/wiki/Kerosene?wprov=sfla1") shouldBe + "https://en.wikipedia.org/wiki/Kerosene" + } + } + + "matchesDomain" should { + + "match wikipedia.org" { + sanitizer.matchesDomain("https://wikipedia.org") shouldBe true + } + + "match en.wikipedia.org" { + sanitizer.matchesDomain("https://en.wikipedia.org") shouldBe true + } + + "match m.en.wikipedia.org" { + sanitizer.matchesDomain("https://de.m.wikipedia.org") shouldBe true + } + + "don't match google.com" { + sanitizer.matchesDomain("https://google.com") shouldBe false + } + } + }, + )