]> gitweb.stoutner.com Git - PrivacyBrowserAndroid.git/blobdiff - app/src/main/java/com/stoutner/privacybrowser/helpers/SanitizeUrlHelper.kt
Block trackers listed at privacytests.org. https://redmine.stoutner.com/issues/863
[PrivacyBrowserAndroid.git] / app / src / main / java / com / stoutner / privacybrowser / helpers / SanitizeUrlHelper.kt
diff --git a/app/src/main/java/com/stoutner/privacybrowser/helpers/SanitizeUrlHelper.kt b/app/src/main/java/com/stoutner/privacybrowser/helpers/SanitizeUrlHelper.kt
new file mode 100644 (file)
index 0000000..7e4ad98
--- /dev/null
@@ -0,0 +1,85 @@
+/*
+ * Copyright ©2022 Soren Stoutner <soren@stoutner.com>.
+ *
+ * This file is part of Privacy Browser Android <https://www.stoutner.com/privacy-browser-android>.
+ *
+ * Privacy Browser Android is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * Privacy Browser Android is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with Privacy Browser Android.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+package com.stoutner.privacybrowser.helpers
+
+private val trackingQueriesList = listOf(
+    "__hsfp=",             // HubSpot.
+    "__hssc=",             // HubSpot.
+    "__hstc=",             // HubSpot.
+    "__s=",                // Drip.com.
+    "_hsenc=",             // HubSpot.
+    "_openstat=",          // Yandex.
+    "dclid=",              // DoubleClick ID.
+    "fbadid=",             // FaceBook Ad ID.
+    "fbclid=",             // FaceBook Click ID.
+    "gclid=",              // Google Click ID.
+    "hsCtaTracking=",      // HubSpot.
+    "igshid=",             // Instagram.
+    "mc_eid=",             // MailChimp Email ID.
+    "?mkt_tok=",           // Adobe Marketo.
+    "ml_subscriber=",      // MailerLite.
+    "ml_subscriber_hash=", // MailerLite.
+    "msclkid=",            // Microsoft Click ID.
+    "oly_anon_id=",        // Omeda Anonymous ID.
+    "oly_enc_id=",         // Omeda ID.
+    "rb_clickid=",         // Unknown tracker.
+    "s_cid=",              // Adobe Site Catalyst.
+    "utm_",                // Google Analytics.
+    "vero_conv=",          // Vero.
+    "vero_id=",            // Vero ID.
+    "wickedid=",           // Wicked Reports ID.
+    "yclid="               // Yandex Click ID.
+)
+
+class SanitizeUrlHelper {
+    fun sanitizeTrackingQueries(inputUrl: String): String {
+        // Make a copy of the input URL so that it can be modified.
+        var url = inputUrl
+
+        // Remove each tracking query from the URL.
+        trackingQueriesList.forEach {
+            if (url.contains("?$it")) {  // Check for an initial query
+                // Remove the first query and anything after it.
+                url = url.substring(0, url.indexOf("?$it"))
+            }
+            else if (url.contains("&$it")) {  // Check for a subsequent query.
+                // Remove the query and anything after it.
+                url = url.substring(0, url.indexOf("&$it"))
+            }
+        }
+
+        // Return the sanitized URL.
+        return url
+    }
+
+    fun sanitizeAmpRedirects(inputUrl: String): String {
+        // Make a copy of the input URL so that it can be modified.
+        var url = inputUrl
+
+        // Remove Twitter `amp=1`.
+        if (url.contains("?amp"))
+            url = url.substring(0, url.indexOf("?amp"))
+        else if (url.contains("&amp"))
+            url = url.substring(0, url.indexOf("&amp"))
+
+        // Return the sanitized URL.
+        return url
+    }
+}
\ No newline at end of file