
421 lines
18 KiB
Raw Normal View History

2023-12-28 13:17:16 +00:00
package eu.faircode.email;
This file is part of FairEmail.
FairEmail is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
FairEmail is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with FairEmail. If not, see <http://www.gnu.org/licenses/>.
2024-01-01 07:50:49 +00:00
Copyright 2018-2024 by Marcel Bokhorst (M66B)
2023-12-28 13:17:16 +00:00
import android.content.Context;
2024-03-22 07:30:07 +00:00
import android.content.SharedPreferences;
2023-12-28 13:17:16 +00:00
import android.net.Uri;
import android.text.TextUtils;
import androidx.annotation.Nullable;
2024-03-22 07:30:07 +00:00
import androidx.preference.PreferenceManager;
2023-12-28 13:17:16 +00:00
2023-12-29 12:25:35 +00:00
import org.json.JSONException;
import java.io.BufferedOutputStream;
2023-12-28 13:17:16 +00:00
import java.io.BufferedReader;
2023-12-29 12:25:35 +00:00
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
2023-12-28 13:17:16 +00:00
import java.io.InputStreamReader;
2023-12-29 12:25:35 +00:00
import java.io.OutputStream;
import java.net.URL;
2023-12-28 13:17:16 +00:00
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
2024-03-22 07:30:07 +00:00
import java.util.Date;
2023-12-28 13:17:16 +00:00
import java.util.List;
import java.util.regex.Pattern;
2023-12-29 12:25:35 +00:00
import javax.net.ssl.HttpsURLConnection;
2023-12-28 13:17:16 +00:00
public class Adguard {
// https://github.com/AdguardTeam/AdguardFilters
// https://github.com/AdguardTeam/FiltersRegistry/blob/master/filters/filter_17_TrackParam/filter.txt
2023-12-28 21:59:21 +00:00
// https://github.com/AdguardTeam/TestCases/tree/master/public/Filters/removeparam-rules
2023-12-28 13:17:16 +00:00
2023-12-29 12:25:35 +00:00
// Timeout for fetching the filter list, in milliseconds
// NOTE(review): no use of this constant is visible in this excerpt - confirm it is applied to the connection in download()
private final static int FETCH_TIMEOUT = 20 * 1000; // milliseconds
// URL of the AdGuard "TrackParam" filter list (filter 17) that download() retrieves
private final static String LIST = "https://raw.githubusercontent.com/AdguardTeam/FiltersRegistry/master/filters/filter_17_TrackParam/filter.txt";
2023-12-29 07:55:08 +00:00
// Read-only list of content type modifier names; filter() iterates it when a modifier is negated with "~"
// NOTE(review): the list entries and the closing "));" are missing from this copy - restore them from version control
private static final List<String> ALL_CONTENT = Collections.unmodifiableList(Arrays.asList(
2023-12-28 13:17:16 +00:00
/**
 * Applies the $removeparam rules of the locally stored AdGuard filter list to a URI.
 *
 * The method returns null right away when the URI is opaque, when it has no host,
 * or when the filter list file does not exist.
 * Otherwise the file is read line by line; each rule is split into a pattern and
 * a list of modifiers, and the removeparam values of the rules that apply to this
 * URI are collected into three lists (removes, importants, excepts).
 * Finally the query parameters are checked against these lists via omitParam().
 *
 * NOTE(review): this copy of the method has lost lines (closing braces and the bodies
 * of several if/else statements) and contains version control timestamps between the
 * statements. Restore the method from version control before compiling or changing it.
 *
 * @param context used to locate the filter list file
 * @param uri the URI to check
 * @return the rebuilt URI when at least one query parameter was flagged for omission,
 * null otherwise (including when the second try block throws)
 */
public static Uri filter(Context context, Uri uri) {
if (uri.isOpaque())
return null;
String host = uri.getHost();
if (TextUtils.isEmpty(host))
return null;
2023-12-29 12:25:35 +00:00
// Without a downloaded filter list there is nothing to apply
File file = getFile(context);
if (!file.exists())
return null;
2023-12-28 13:17:16 +00:00
// removeparam values of matching rules
List<String> removes = new ArrayList<>();
2023-12-28 22:41:31 +00:00
// removeparam values of matching rules that carry the "important" modifier
List<String> importants = new ArrayList<>();
2023-12-28 13:17:16 +00:00
// removeparam values of matching exception ("@@") rules
List<String> excepts = new ArrayList<>();
2023-12-29 12:25:35 +00:00
try (BufferedReader br = new BufferedReader(new InputStreamReader(new FileInputStream(file)))) {
2023-12-28 13:17:16 +00:00
String line;
while ((line = br.readLine()) != null) {
2023-12-28 20:33:12 +00:00
// https://adguard.com/kb/general/ad-filtering/create-own-filters/#comments
2023-12-28 13:17:16 +00:00
// Empty lines and comment lines (starting with "!")
// NOTE(review): the statement guarded by this condition is missing here - presumably the line is skipped
if (TextUtils.isEmpty(line) || line.startsWith("!"))
2023-12-28 20:33:12 +00:00
// rule = ["@@"] pattern [ "$" modifiers ]
// modifiers = [modifier0, modifier1[, ...[, modifierN]]]
2023-12-28 13:17:16 +00:00
// Locate the first "$" that is not escaped with a backslash
int dollar = line.indexOf('$');
while (dollar > 0 && line.charAt(dollar - 1) == '\\')
dollar = line.indexOf('$', dollar + 1);
if (dollar < 0) {
// No modifiers: warn, except for lines containing "##"
if (!line.contains("##"))
Log.w("Adguard command missing line=" + line);
2023-12-28 20:33:12 +00:00
// Split into pattern and modifier list, unescaping "\$"
String pattern = line.substring(0, dollar)
2023-12-28 17:31:14 +00:00
.replace("\\$", "$");
String rest = line.substring(dollar + 1)
.replace("\\$", "$");
2023-12-28 13:17:16 +00:00
int start = 0;
2023-12-28 20:33:12 +00:00
// Split the modifiers on commas that are not escaped with a backslash
List<String> modifiers = new ArrayList<>();
2023-12-28 13:17:16 +00:00
while (start < rest.length()) {
int comma = rest.indexOf(',', start);
while (comma > 0 && rest.charAt(comma - 1) == '\\')
comma = rest.indexOf(',', comma + 1);
int end = (comma < 0 ? rest.length() : comma);
2023-12-28 20:33:12 +00:00
modifiers.add(rest.substring(start, end)
2023-12-28 17:31:14 +00:00
.replace("\\,", ","));
2023-12-28 13:17:16 +00:00
start = (comma < 0 ? end : end + 1);
// State collected from the modifiers of this rule
String remove = null;
2023-12-28 22:41:31 +00:00
boolean important = false;
2023-12-28 13:17:16 +00:00
boolean matches = true;
2023-12-29 07:55:08 +00:00
List<String> contents = new ArrayList<>();
2023-12-28 20:33:12 +00:00
for (String modifier : modifiers) {
// modifier = name ["=" param]
int equal = modifier.indexOf('=');
String name = (equal < 0 ? modifier : modifier.substring(0, equal));
String param = (equal < 0 ? "" : modifier.substring(equal + 1));
if ("removeparam".equals(name)) {
// https://adguard.com/kb/general/ad-filtering/create-own-filters/#removeparam-modifier
remove = param;
} else if ("domain".equals(name)) {
2023-12-28 13:17:16 +00:00
// https://adguard.com/kb/general/ad-filtering/create-own-filters/#domain-modifier
2023-12-28 20:33:12 +00:00
// domains = ["~"] entry_0 ["|" ["~"] entry_1 ["|" ["~"]entry_2 ["|" ... ["|" ["~"]entry_N]]]]
// entry_i = ( regular_domain / any_tld_domain / regexp )
2023-12-28 13:17:16 +00:00
matches = false;
List<String> domains = new ArrayList<>();
start = 0;
2023-12-28 20:33:12 +00:00
// Split the domain entries on pipes that are not escaped with a backslash
while (start < param.length()) {
int pipe = param.indexOf('|', start);
while (pipe > 0 && param.charAt(pipe - 1) == '\\')
pipe = param.indexOf('|', pipe + 1);
int end = (pipe < 0 ? param.length() : pipe);
domains.add(param.substring(start, end)
2023-12-28 17:31:14 +00:00
.replace("\\|", "|"));
2023-12-28 13:17:16 +00:00
start = (pipe < 0 ? end : end + 1);
// Set to true as soon as a negated ("~") entry is seen
boolean and = false;
for (String domain : domains) {
boolean not = domain.startsWith("~");
if (not)
and = true;
String d = (not ? domain.substring(1) : domain);
if (d.endsWith("*")) {
// any_tld_domain
matches = host.startsWith(d.substring(0, d.length() - 1));
} else if (d.startsWith("/")) {
// regexp
int slash = d.lastIndexOf('/');
if (slash < 1) {
Log.w("Adguard missing closing slash domain=" + domain);
// the characters /, $, and | must be escaped with \
String regex = d.substring(1, slash)
.replace("\\/", "/");
Log.w("Adguard domain regex=" + regex);
matches = Pattern.compile(regex).matcher(host).find();
} else {
// regular_domain
matches = host.equals(d);
// A negated entry inverts the result
if (not)
matches = !matches;
if (matches)
Log.i("Adguard domain=" + domain + " host=" + host + " not=" + not);
// NOTE(review): the statement guarded by this condition is missing here - presumably it ends the domain loop
if (and != matches)
2023-12-28 22:41:31 +00:00
} else if ("important".equals(name)) {
important = true;
Log.w("Adguard important=" + param);
2023-12-28 13:17:16 +00:00
} else {
2023-12-29 07:55:08 +00:00
// Any other modifier name; a leading "~" is stripped and the name is compared with the ALL_CONTENT entries
// NOTE(review): the statements that record the content types are missing here
if (name.startsWith("~")) {
name = name.substring(1);
for (String content : ALL_CONTENT)
if (!name.equals(content))
} else
2023-12-28 13:17:16 +00:00
// NOTE(review): the statement guarded by this condition is missing here
if (remove == null || !matches)
2023-12-29 07:55:08 +00:00
// $removeparam rules that do not have any content type modifiers will match only requests where content type is document.
if (contents.size() == 0)
// Content types derived from the MIME type guessed from the last path segment
// NOTE(review): the statements of the following if/else chain are missing here
List<String> recognized = new ArrayList<>();
String mime = Helper.guessMimeType(uri.getLastPathSegment());
if (mime.startsWith("audio/") || mime.startsWith("video/"))
else if (mime.startsWith("image/"))
else if ("text/css".equals(mime))
else if ("application/javascript".equals(mime))
else if (mime.startsWith("font/"))
recognized.addAll(Arrays.asList("document", "subdocument", "xmlhttprequest"));
// Check whether the rule lists at least one of the recognized content types
boolean found = false;
for (String content : recognized)
if (contents.contains(content)) {
found = true;
if (!found) {
Log.i("Adguard skipping mime=" + mime +
" recognized=" + TextUtils.join(", ", recognized) +
" contents=" + TextUtils.join(", ", contents) +
" line=" + line);
2023-12-28 13:17:16 +00:00
boolean except = false;
2023-12-28 20:33:12 +00:00
// An empty pattern matches every URI
matches = TextUtils.isEmpty(pattern);
2023-12-28 13:17:16 +00:00
if (!matches) {
// https://adguard.com/kb/general/ad-filtering/create-own-filters/#basic-rules-special-characters
2023-12-28 20:33:12 +00:00
if (pattern.startsWith("@@")) {
// a marker that is used in rules of exception.
// To turn off filtering for a request, start your rule with this marker.
2023-12-28 13:17:16 +00:00
except = true;
2023-12-28 20:33:12 +00:00
pattern = pattern.substring(2);
2023-12-28 13:17:16 +00:00
String u = uri.toString();
2023-12-28 20:33:12 +00:00
if (pattern.startsWith("||")) {
// an indication to apply the rule to the specified domain and its subdomains.
// With this character, you do not have to specify a particular protocol and subdomain in address mask.
// It means that || stands for http://*., https://*., ws://*., wss://*. at once.
2023-12-28 13:17:16 +00:00
// Drop everything up to and including "//" from the URI text
int ss = u.indexOf("//");
if (ss > 0)
u = u.substring(ss + 2);
2023-12-28 20:33:12 +00:00
pattern = pattern.substring(2);
2023-12-28 13:17:16 +00:00
// Translate the address mask into a regular expression, character by character
// NOTE(review): the append statements for "*", "^" and ordinary characters are missing here
StringBuilder b = new StringBuilder();
2023-12-28 20:33:12 +00:00
for (char c : pattern.toCharArray())
if (c == '*') {
// a wildcard character. It is used to represent any set of characters.
// This can also be an empty string or a string of any length.
2023-12-28 13:17:16 +00:00
2023-12-28 20:33:12 +00:00
} else if (c == '^') {
// a separator character mark.
// Separator character is any character, but a letter, a digit, or one of the following: _ - . %.
2023-12-28 13:17:16 +00:00
2023-12-28 20:33:12 +00:00
} else if (c == '|') {
// a pointer to the beginning or the end of address.
// The value depends on the character placement in the mask.
2023-12-28 13:17:16 +00:00
// At the start of the expression this becomes "^", anywhere else "$"
b.append(b.length() == 0 ? '^' : '$');
2023-12-28 20:33:12 +00:00
Log.w("Adguard anchor expr=" + pattern);
2023-12-28 13:17:16 +00:00
} else {
// Characters with a special meaning in a regular expression
if ("\\.?![]{}()<>*+-=^$|".indexOf(c) >= 0)
matches = Pattern.compile(b.toString()).matcher(u).find();
if (matches)
Log.i("Adguard expr=" + b + " remove=" + remove + " except=" + except);
// Record the removeparam value of a matching rule
// NOTE(review): the add statements are missing here
if (matches)
if (except) {
if (!excepts.contains(remove))
} else {
if (!removes.contains(remove))
2023-12-28 22:41:31 +00:00
if (important && !importants.contains(remove))
2023-12-28 13:17:16 +00:00
// NOTE(review): the body of this catch block is missing here
} catch (Throwable ex) {
try {
// Check every query parameter against the collected removeparam values
Uri.Builder builder = uri.buildUpon();
boolean changed = false;
for (String key : uri.getQueryParameterNames()) {
boolean omit = false;
for (String remove : removes) {
String value = uri.getQueryParameter(key);
if (omitParam(remove, key, value)) {
omit = true;
2023-12-28 22:41:31 +00:00
// Exceptions are only consulted when the removeparam value is not marked important
if (!importants.contains(remove))
for (String except : excepts)
if (omitParam(except, key, value)) {
Log.i("Adguard except=" + except);
omit = false;
2023-12-28 13:17:16 +00:00
// NOTE(review): presumably parameters are re-appended only when they are not omitted - the else is missing here
if (omit)
changed = true;
for (String value : uri.getQueryParameters(key))
builder.appendQueryParameter(key, value);
return (changed ? builder.build() : null);
} catch (Throwable ex) {
return null;
private static boolean omitParam(String remove, String key, String value) {
// https://adguard.com/kb/general/ad-filtering/create-own-filters/#removeparam-modifier
2023-12-28 20:33:12 +00:00
if ("".equals(remove)) {
// Specify naked $removeparam to remove all query parameters
2023-12-28 13:17:16 +00:00
return true;
2023-12-28 20:33:12 +00:00
2023-12-28 13:17:16 +00:00
2023-12-28 21:59:21 +00:00
// $removeparam=~param — removes all query parameters with the name different from param.
// $removeparam=~/regexp/ — removes all query parameters that do not match the regexp regular expression.
boolean not = remove.startsWith("~");
if (not)
remove = remove.substring(1);
2023-12-28 13:17:16 +00:00
if (remove.startsWith("/")) {
2023-12-28 20:33:12 +00:00
// $removeparam=/regexp/[options]
// the only supported option is i which makes matching case-insensitive.
2023-12-28 13:17:16 +00:00
int end = remove.lastIndexOf('/');
if (end < 1) {
Log.w("Adguard missing slash remove=" + remove + " end=" + end);
return false;
String regex = remove.substring(1, end)
.replace("\\/", "/");
String rest = remove.substring(end + 1);
Log.i("Adguard regex=" + regex + " rest=" + rest);
2023-12-28 21:59:21 +00:00
int flags = 0;
if ("i".equals(rest))
flags = Pattern.CASE_INSENSITIVE;
else if (!TextUtils.isEmpty(rest))
2023-12-28 13:17:16 +00:00
Log.w("Adguard unexpected remove=" + remove);
String all = key + "=" + value;
2023-12-28 21:59:21 +00:00
if (Pattern.compile(regex, flags).matcher(all).find() ^ not) {
2023-12-28 13:17:16 +00:00
Log.i("Adguard omit regex=" + regex);
return true;
2023-12-28 21:59:21 +00:00
} else if (remove.equals(key) ^ not) {
2023-12-28 20:33:12 +00:00
// $removeparam=param
2023-12-28 13:17:16 +00:00
Log.i("Adguard omit key=" + key);
return true;
return false;
2023-12-29 12:25:35 +00:00
static void download(Context context) throws IOException, JSONException {
File file = getFile(context);
URL url = new URL(LIST);
Log.i("GET " + url);
HttpsURLConnection connection = (HttpsURLConnection) url.openConnection();
ConnectionHelper.setUserAgent(context, connection);
try {
int status = connection.getResponseCode();
if (status != HttpsURLConnection.HTTP_OK)
throw new FileNotFoundException("Error " + status + ": " + connection.getResponseMessage());
try (OutputStream os = new BufferedOutputStream(new FileOutputStream(file))) {
Helper.copy(connection.getInputStream(), os);
2024-03-22 07:30:07 +00:00
SharedPreferences prefs = PreferenceManager.getDefaultSharedPreferences(context);
prefs.edit().putLong("adguard_last", new Date().getTime()).apply();
2023-12-29 12:25:35 +00:00
} finally {
private static File getFile(Context context) {
return new File(context.getFilesDir(), "adguard.txt");
2023-12-28 13:17:16 +00:00