2018-08-02 13:33:06 +00:00
|
|
|
package eu.faircode.email;
|
|
|
|
|
|
|
|
/*
|
2018-08-14 05:53:24 +00:00
|
|
|
This file is part of FairEmail.
|
2018-08-02 13:33:06 +00:00
|
|
|
|
2018-08-14 05:53:24 +00:00
|
|
|
FairEmail is free software: you can redistribute it and/or modify
|
2018-08-02 13:33:06 +00:00
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
2018-10-29 10:46:49 +00:00
|
|
|
FairEmail is distributed in the hope that it will be useful,
|
2018-08-02 13:33:06 +00:00
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
2018-10-29 10:46:49 +00:00
|
|
|
along with FairEmail. If not, see <http://www.gnu.org/licenses/>.
|
2018-08-02 13:33:06 +00:00
|
|
|
|
2020-01-05 17:32:53 +00:00
|
|
|
Copyright 2018-2020 by Marcel Bokhorst (M66B)
|
2018-08-02 13:33:06 +00:00
|
|
|
*/
|
|
|
|
|
2018-12-14 09:11:45 +00:00
|
|
|
import android.content.Context;
|
2019-03-10 18:03:05 +00:00
|
|
|
import android.content.SharedPreferences;
|
2019-10-04 21:04:03 +00:00
|
|
|
import android.graphics.Bitmap;
|
|
|
|
import android.graphics.Canvas;
|
2019-09-24 12:46:12 +00:00
|
|
|
import android.graphics.Color;
|
2019-10-04 21:04:03 +00:00
|
|
|
import android.graphics.drawable.Drawable;
|
2019-09-13 11:46:52 +00:00
|
|
|
import android.net.Uri;
|
2019-09-07 18:13:58 +00:00
|
|
|
import android.os.Build;
|
2019-02-10 12:01:21 +00:00
|
|
|
import android.text.Html;
|
2019-08-29 19:57:04 +00:00
|
|
|
import android.text.SpannableStringBuilder;
|
2019-02-10 12:01:21 +00:00
|
|
|
import android.text.Spanned;
|
2018-12-14 09:11:45 +00:00
|
|
|
import android.text.TextUtils;
|
2019-08-29 19:57:04 +00:00
|
|
|
import android.text.style.ForegroundColorSpan;
|
2018-12-14 09:11:45 +00:00
|
|
|
import android.util.Base64;
|
2020-03-26 14:25:44 +00:00
|
|
|
import android.view.textclassifier.TextClassificationManager;
|
|
|
|
import android.view.textclassifier.TextLanguage;
|
2018-12-14 09:11:45 +00:00
|
|
|
|
2019-04-17 18:21:44 +00:00
|
|
|
import androidx.annotation.NonNull;
|
|
|
|
import androidx.annotation.Nullable;
|
2019-10-04 21:04:03 +00:00
|
|
|
import androidx.core.content.ContextCompat;
|
2020-02-14 08:34:28 +00:00
|
|
|
import androidx.core.content.FileProvider;
|
2020-01-26 12:41:12 +00:00
|
|
|
import androidx.core.graphics.ColorUtils;
|
2019-04-17 18:21:44 +00:00
|
|
|
import androidx.core.text.HtmlCompat;
|
|
|
|
import androidx.core.util.PatternsCompat;
|
|
|
|
import androidx.preference.PreferenceManager;
|
|
|
|
|
2020-04-21 07:04:55 +00:00
|
|
|
import com.steadystate.css.dom.CSSMediaRuleImpl;
|
2020-04-20 13:01:05 +00:00
|
|
|
import com.steadystate.css.dom.CSSStyleRuleImpl;
|
2020-04-21 07:04:55 +00:00
|
|
|
import com.steadystate.css.dom.MediaListImpl;
|
2020-04-20 13:01:05 +00:00
|
|
|
import com.steadystate.css.parser.CSSOMParser;
|
|
|
|
import com.steadystate.css.parser.SACParserCSS3;
|
|
|
|
import com.steadystate.css.parser.selectors.ClassConditionImpl;
|
|
|
|
import com.steadystate.css.parser.selectors.ConditionalSelectorImpl;
|
|
|
|
|
2019-03-10 19:39:17 +00:00
|
|
|
import org.jsoup.nodes.Attribute;
|
2020-02-02 12:03:06 +00:00
|
|
|
import org.jsoup.nodes.Comment;
|
2018-08-02 13:33:06 +00:00
|
|
|
import org.jsoup.nodes.Document;
|
2018-08-28 09:10:31 +00:00
|
|
|
import org.jsoup.nodes.Element;
|
2018-08-02 13:33:06 +00:00
|
|
|
import org.jsoup.nodes.Node;
|
|
|
|
import org.jsoup.nodes.TextNode;
|
2019-03-12 09:04:16 +00:00
|
|
|
import org.jsoup.safety.Cleaner;
|
2018-08-28 12:52:33 +00:00
|
|
|
import org.jsoup.safety.Whitelist;
|
2020-02-02 12:03:06 +00:00
|
|
|
import org.jsoup.select.NodeFilter;
|
2018-08-02 13:33:06 +00:00
|
|
|
import org.jsoup.select.NodeTraversor;
|
|
|
|
import org.jsoup.select.NodeVisitor;
|
2020-04-20 13:01:05 +00:00
|
|
|
import org.w3c.css.sac.CSSException;
|
|
|
|
import org.w3c.css.sac.CSSParseException;
|
|
|
|
import org.w3c.css.sac.ErrorHandler;
|
|
|
|
import org.w3c.css.sac.InputSource;
|
|
|
|
import org.w3c.css.sac.Selector;
|
|
|
|
import org.w3c.dom.css.CSSRule;
|
|
|
|
import org.w3c.dom.css.CSSRuleList;
|
|
|
|
import org.w3c.dom.css.CSSStyleSheet;
|
2020-04-21 07:04:55 +00:00
|
|
|
import org.w3c.dom.stylesheets.MediaList;
|
2018-08-02 13:33:06 +00:00
|
|
|
|
2019-10-04 21:04:03 +00:00
|
|
|
import java.io.ByteArrayOutputStream;
|
2018-12-14 09:11:45 +00:00
|
|
|
import java.io.File;
|
2020-02-28 09:01:18 +00:00
|
|
|
import java.io.FileInputStream;
|
2018-12-14 09:11:45 +00:00
|
|
|
import java.io.IOException;
|
2020-02-28 09:01:18 +00:00
|
|
|
import java.io.InputStream;
|
2020-04-20 13:01:05 +00:00
|
|
|
import java.io.StringReader;
|
2019-09-13 11:46:52 +00:00
|
|
|
import java.util.ArrayList;
|
2019-01-05 11:17:33 +00:00
|
|
|
import java.util.Arrays;
|
2019-03-14 19:33:01 +00:00
|
|
|
import java.util.Collections;
|
2020-01-22 11:28:39 +00:00
|
|
|
import java.util.HashMap;
|
2019-01-05 11:17:33 +00:00
|
|
|
import java.util.List;
|
2019-09-23 20:07:22 +00:00
|
|
|
import java.util.Locale;
|
2020-02-20 09:07:01 +00:00
|
|
|
import java.util.Map;
|
2018-08-05 08:53:43 +00:00
|
|
|
import java.util.regex.Matcher;
|
2019-06-05 08:23:41 +00:00
|
|
|
import java.util.regex.Pattern;
|
2018-08-02 13:33:06 +00:00
|
|
|
|
2019-03-06 10:39:10 +00:00
|
|
|
import static androidx.core.text.HtmlCompat.FROM_HTML_SEPARATOR_LINE_BREAK_LIST_ITEM;
|
2019-02-10 12:01:21 +00:00
|
|
|
import static androidx.core.text.HtmlCompat.TO_HTML_PARAGRAPH_LINES_CONSECUTIVE;
|
2020-04-20 13:01:05 +00:00
|
|
|
import static org.w3c.css.sac.Condition.SAC_CLASS_CONDITION;
|
2019-02-10 12:01:21 +00:00
|
|
|
|
2018-09-12 11:54:16 +00:00
|
|
|
public class HtmlHelper {
|
2019-10-20 17:35:31 +00:00
|
|
|
private static final int PREVIEW_SIZE = 500; // characters
|
2019-02-19 16:21:25 +00:00
|
|
|
|
2020-02-20 10:37:40 +00:00
|
|
|
private static final int DEFAULT_FONT_SIZE = 16; // pixels
|
2020-04-20 07:57:42 +00:00
|
|
|
private static final float FONT_SMALL = 0.8f;
|
|
|
|
private static final float FONT_LARGE = 1.25f;
|
2019-09-25 07:41:10 +00:00
|
|
|
private static final float MIN_LUMINANCE = 0.5f;
|
2019-11-14 08:15:18 +00:00
|
|
|
private static final int TAB_SIZE = 2;
|
2019-09-01 07:44:03 +00:00
|
|
|
private static final int MAX_AUTO_LINK = 250;
|
2020-02-14 10:06:48 +00:00
|
|
|
private static final int MAX_FORMAT_TEXT_SIZE = 50 * 1024; // characters
|
|
|
|
private static final int MAX_FULL_TEXT_SIZE = 1024 * 1024; // characters
|
2019-08-20 18:05:11 +00:00
|
|
|
private static final int TRACKING_PIXEL_SURFACE = 25; // pixels
|
2019-05-13 09:03:15 +00:00
|
|
|
|
2020-01-22 11:28:39 +00:00
|
|
|
private static final HashMap<String, Integer> x11ColorMap = new HashMap<>();
|
|
|
|
|
|
|
|
static {
|
|
|
|
// https://www.w3.org/TR/css-color-3/
|
|
|
|
x11ColorMap.put("aliceblue", 0xF0F8FF);
|
|
|
|
x11ColorMap.put("antiquewhite", 0xFAEBD7);
|
|
|
|
x11ColorMap.put("aqua", 0x00FFFF);
|
|
|
|
x11ColorMap.put("aquamarine", 0x7FFFD4);
|
|
|
|
x11ColorMap.put("azure", 0xF0FFFF);
|
|
|
|
x11ColorMap.put("beige", 0xF5F5DC);
|
|
|
|
x11ColorMap.put("bisque", 0xFFE4C4);
|
|
|
|
x11ColorMap.put("black", 0x000000);
|
|
|
|
x11ColorMap.put("blanchedalmond", 0xFFEBCD);
|
|
|
|
x11ColorMap.put("blue", 0x0000FF);
|
|
|
|
x11ColorMap.put("blueviolet", 0x8A2BE2);
|
|
|
|
x11ColorMap.put("brown", 0xA52A2A);
|
|
|
|
x11ColorMap.put("burlywood", 0xDEB887);
|
|
|
|
x11ColorMap.put("cadetblue", 0x5F9EA0);
|
|
|
|
x11ColorMap.put("chartreuse", 0x7FFF00);
|
|
|
|
x11ColorMap.put("chocolate", 0xD2691E);
|
|
|
|
x11ColorMap.put("coral", 0xFF7F50);
|
|
|
|
x11ColorMap.put("cornflowerblue", 0x6495ED);
|
|
|
|
x11ColorMap.put("cornsilk", 0xFFF8DC);
|
|
|
|
x11ColorMap.put("crimson", 0xDC143C);
|
|
|
|
x11ColorMap.put("cyan", 0x00FFFF);
|
|
|
|
x11ColorMap.put("darkblue", 0x00008B);
|
|
|
|
x11ColorMap.put("darkcyan", 0x008B8B);
|
|
|
|
x11ColorMap.put("darkgoldenrod", 0xB8860B);
|
|
|
|
x11ColorMap.put("darkgray", 0xA9A9A9);
|
|
|
|
x11ColorMap.put("darkgreen", 0x006400);
|
|
|
|
x11ColorMap.put("darkgrey", 0xA9A9A9);
|
|
|
|
x11ColorMap.put("darkkhaki", 0xBDB76B);
|
|
|
|
x11ColorMap.put("darkmagenta", 0x8B008B);
|
|
|
|
x11ColorMap.put("darkolivegreen", 0x556B2F);
|
|
|
|
x11ColorMap.put("darkorange", 0xFF8C00);
|
|
|
|
x11ColorMap.put("darkorchid", 0x9932CC);
|
|
|
|
x11ColorMap.put("darkred", 0x8B0000);
|
|
|
|
x11ColorMap.put("darksalmon", 0xE9967A);
|
|
|
|
x11ColorMap.put("darkseagreen", 0x8FBC8F);
|
|
|
|
x11ColorMap.put("darkslateblue", 0x483D8B);
|
|
|
|
x11ColorMap.put("darkslategray", 0x2F4F4F);
|
|
|
|
x11ColorMap.put("darkslategrey", 0x2F4F4F);
|
|
|
|
x11ColorMap.put("darkturquoise", 0x00CED1);
|
|
|
|
x11ColorMap.put("darkviolet", 0x9400D3);
|
|
|
|
x11ColorMap.put("deeppink", 0xFF1493);
|
|
|
|
x11ColorMap.put("deepskyblue", 0x00BFFF);
|
|
|
|
x11ColorMap.put("dimgray", 0x696969);
|
|
|
|
x11ColorMap.put("dimgrey", 0x696969);
|
|
|
|
x11ColorMap.put("dodgerblue", 0x1E90FF);
|
|
|
|
x11ColorMap.put("firebrick", 0xB22222);
|
|
|
|
x11ColorMap.put("floralwhite", 0xFFFAF0);
|
|
|
|
x11ColorMap.put("forestgreen", 0x228B22);
|
|
|
|
x11ColorMap.put("fuchsia", 0xFF00FF);
|
|
|
|
x11ColorMap.put("gainsboro", 0xDCDCDC);
|
|
|
|
x11ColorMap.put("ghostwhite", 0xF8F8FF);
|
|
|
|
x11ColorMap.put("gold", 0xFFD700);
|
|
|
|
x11ColorMap.put("goldenrod", 0xDAA520);
|
|
|
|
x11ColorMap.put("gray", 0x808080);
|
|
|
|
x11ColorMap.put("green", 0x008000);
|
|
|
|
x11ColorMap.put("greenyellow", 0xADFF2F);
|
|
|
|
x11ColorMap.put("grey", 0x808080);
|
|
|
|
x11ColorMap.put("honeydew", 0xF0FFF0);
|
|
|
|
x11ColorMap.put("hotpink", 0xFF69B4);
|
|
|
|
x11ColorMap.put("indianred", 0xCD5C5C);
|
|
|
|
x11ColorMap.put("indigo", 0x4B0082);
|
|
|
|
x11ColorMap.put("ivory", 0xFFFFF0);
|
|
|
|
x11ColorMap.put("khaki", 0xF0E68C);
|
|
|
|
x11ColorMap.put("lavender", 0xE6E6FA);
|
|
|
|
x11ColorMap.put("lavenderblush", 0xFFF0F5);
|
|
|
|
x11ColorMap.put("lawngreen", 0x7CFC00);
|
|
|
|
x11ColorMap.put("lemonchiffon", 0xFFFACD);
|
|
|
|
x11ColorMap.put("lightblue", 0xADD8E6);
|
|
|
|
x11ColorMap.put("lightcoral", 0xF08080);
|
|
|
|
x11ColorMap.put("lightcyan", 0xE0FFFF);
|
|
|
|
x11ColorMap.put("lightgoldenrodyellow", 0xFAFAD2);
|
|
|
|
x11ColorMap.put("lightgray", 0xD3D3D3);
|
|
|
|
x11ColorMap.put("lightgreen", 0x90EE90);
|
|
|
|
x11ColorMap.put("lightgrey", 0xD3D3D3);
|
|
|
|
x11ColorMap.put("lightpink", 0xFFB6C1);
|
|
|
|
x11ColorMap.put("lightsalmon", 0xFFA07A);
|
|
|
|
x11ColorMap.put("lightseagreen", 0x20B2AA);
|
|
|
|
x11ColorMap.put("lightskyblue", 0x87CEFA);
|
|
|
|
x11ColorMap.put("lightslategray", 0x778899);
|
|
|
|
x11ColorMap.put("lightslategrey", 0x778899);
|
|
|
|
x11ColorMap.put("lightsteelblue", 0xB0C4DE);
|
|
|
|
x11ColorMap.put("lightyellow", 0xFFFFE0);
|
|
|
|
x11ColorMap.put("lime", 0x00FF00);
|
|
|
|
x11ColorMap.put("limegreen", 0x32CD32);
|
|
|
|
x11ColorMap.put("linen", 0xFAF0E6);
|
|
|
|
x11ColorMap.put("magenta", 0xFF00FF);
|
|
|
|
x11ColorMap.put("maroon", 0x800000);
|
|
|
|
x11ColorMap.put("mediumaquamarine", 0x66CDAA);
|
|
|
|
x11ColorMap.put("mediumblue", 0x0000CD);
|
|
|
|
x11ColorMap.put("mediumorchid", 0xBA55D3);
|
|
|
|
x11ColorMap.put("mediumpurple", 0x9370DB);
|
|
|
|
x11ColorMap.put("mediumseagreen", 0x3CB371);
|
|
|
|
x11ColorMap.put("mediumslateblue", 0x7B68EE);
|
|
|
|
x11ColorMap.put("mediumspringgreen", 0x00FA9A);
|
|
|
|
x11ColorMap.put("mediumturquoise", 0x48D1CC);
|
|
|
|
x11ColorMap.put("mediumvioletred", 0xC71585);
|
|
|
|
x11ColorMap.put("midnightblue", 0x191970);
|
|
|
|
x11ColorMap.put("mintcream", 0xF5FFFA);
|
|
|
|
x11ColorMap.put("mistyrose", 0xFFE4E1);
|
|
|
|
x11ColorMap.put("moccasin", 0xFFE4B5);
|
|
|
|
x11ColorMap.put("navajowhite", 0xFFDEAD);
|
|
|
|
x11ColorMap.put("navy", 0x000080);
|
|
|
|
x11ColorMap.put("oldlace", 0xFDF5E6);
|
|
|
|
x11ColorMap.put("olive", 0x808000);
|
|
|
|
x11ColorMap.put("olivedrab", 0x6B8E23);
|
|
|
|
x11ColorMap.put("orange", 0xFFA500);
|
|
|
|
x11ColorMap.put("orangered", 0xFF4500);
|
|
|
|
x11ColorMap.put("orchid", 0xDA70D6);
|
|
|
|
x11ColorMap.put("palegoldenrod", 0xEEE8AA);
|
|
|
|
x11ColorMap.put("palegreen", 0x98FB98);
|
|
|
|
x11ColorMap.put("paleturquoise", 0xAFEEEE);
|
|
|
|
x11ColorMap.put("palevioletred", 0xDB7093);
|
|
|
|
x11ColorMap.put("papayawhip", 0xFFEFD5);
|
|
|
|
x11ColorMap.put("peachpuff", 0xFFDAB9);
|
|
|
|
x11ColorMap.put("peru", 0xCD853F);
|
|
|
|
x11ColorMap.put("pink", 0xFFC0CB);
|
|
|
|
x11ColorMap.put("plum", 0xDDA0DD);
|
|
|
|
x11ColorMap.put("powderblue", 0xB0E0E6);
|
|
|
|
x11ColorMap.put("purple", 0x800080);
|
|
|
|
x11ColorMap.put("red", 0xFF0000);
|
|
|
|
x11ColorMap.put("rosybrown", 0xBC8F8F);
|
|
|
|
x11ColorMap.put("royalblue", 0x4169E1);
|
|
|
|
x11ColorMap.put("saddlebrown", 0x8B4513);
|
|
|
|
x11ColorMap.put("salmon", 0xFA8072);
|
|
|
|
x11ColorMap.put("sandybrown", 0xF4A460);
|
|
|
|
x11ColorMap.put("seagreen", 0x2E8B57);
|
|
|
|
x11ColorMap.put("seashell", 0xFFF5EE);
|
|
|
|
x11ColorMap.put("sienna", 0xA0522D);
|
|
|
|
x11ColorMap.put("silver", 0xC0C0C0);
|
|
|
|
x11ColorMap.put("skyblue", 0x87CEEB);
|
|
|
|
x11ColorMap.put("slateblue", 0x6A5ACD);
|
|
|
|
x11ColorMap.put("slategray", 0x708090);
|
|
|
|
x11ColorMap.put("slategrey", 0x708090);
|
|
|
|
x11ColorMap.put("snow", 0xFFFAFA);
|
|
|
|
x11ColorMap.put("springgreen", 0x00FF7F);
|
|
|
|
x11ColorMap.put("steelblue", 0x4682B4);
|
|
|
|
x11ColorMap.put("tan", 0xD2B48C);
|
|
|
|
x11ColorMap.put("teal", 0x008080);
|
|
|
|
x11ColorMap.put("thistle", 0xD8BFD8);
|
|
|
|
x11ColorMap.put("tomato", 0xFF6347);
|
|
|
|
x11ColorMap.put("turquoise", 0x40E0D0);
|
|
|
|
x11ColorMap.put("violet", 0xEE82EE);
|
|
|
|
x11ColorMap.put("wheat", 0xF5DEB3);
|
|
|
|
x11ColorMap.put("white", 0xFFFFFF);
|
|
|
|
x11ColorMap.put("whitesmoke", 0xF5F5F5);
|
|
|
|
x11ColorMap.put("yellow", 0xFFFF00);
|
|
|
|
x11ColorMap.put("yellowgreen", 0x9ACD32);
|
|
|
|
}
|
|
|
|
|
2020-03-25 19:25:06 +00:00
|
|
|
static Document sanitizeCompose(Context context, String html, boolean show_images) {
|
|
|
|
try {
|
|
|
|
Document parsed = JsoupEx.parse(html);
|
|
|
|
return sanitize(context, parsed, false, show_images);
|
|
|
|
} catch (Throwable ex) {
|
|
|
|
// OutOfMemoryError
|
|
|
|
Log.e(ex);
|
|
|
|
Document document = Document.createShell("");
|
|
|
|
Element strong = document.createElement("strong");
|
|
|
|
strong.text(Log.formatThrowable(ex));
|
|
|
|
document.body().appendChild(strong);
|
|
|
|
return document;
|
|
|
|
}
|
2020-02-14 08:41:28 +00:00
|
|
|
}
|
|
|
|
|
2020-03-25 19:25:06 +00:00
|
|
|
static Document sanitizeView(Context context, Document parsed, boolean show_images) {
|
2019-10-20 12:15:20 +00:00
|
|
|
try {
|
2020-03-25 19:25:06 +00:00
|
|
|
return sanitize(context, parsed, true, show_images);
|
2019-10-20 12:15:20 +00:00
|
|
|
} catch (Throwable ex) {
|
|
|
|
// OutOfMemoryError
|
|
|
|
Log.e(ex);
|
2019-11-22 18:16:02 +00:00
|
|
|
Document document = Document.createShell("");
|
2019-11-19 20:53:12 +00:00
|
|
|
Element strong = document.createElement("strong");
|
2019-12-06 07:50:46 +00:00
|
|
|
strong.text(Log.formatThrowable(ex));
|
2019-11-22 18:16:02 +00:00
|
|
|
document.body().appendChild(strong);
|
2019-11-19 20:53:12 +00:00
|
|
|
return document;
|
2019-10-20 12:15:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-03-25 19:25:06 +00:00
|
|
|
private static Document sanitize(Context context, Document parsed, boolean view, boolean show_images) {
|
2019-10-04 13:25:04 +00:00
|
|
|
SharedPreferences prefs = PreferenceManager.getDefaultSharedPreferences(context);
|
|
|
|
boolean text_color = prefs.getBoolean("text_color", true);
|
2020-02-20 15:08:33 +00:00
|
|
|
boolean text_size = prefs.getBoolean("text_size", true);
|
2019-10-16 09:05:38 +00:00
|
|
|
boolean display_hidden = prefs.getBoolean("display_hidden", false);
|
2019-10-04 13:25:04 +00:00
|
|
|
boolean disable_tracking = prefs.getBoolean("disable_tracking", true);
|
|
|
|
|
2020-02-09 14:04:35 +00:00
|
|
|
// https://chromium.googlesource.com/chromium/blink/+/master/Source/core/css/html.css
|
2019-05-13 09:03:15 +00:00
|
|
|
|
2020-02-02 12:03:06 +00:00
|
|
|
// <!--[if ...]><!--> ... <!--<![endif]-->
|
2020-02-04 09:10:36 +00:00
|
|
|
// https://docs.microsoft.com/en-us/previous-versions/windows/internet-explorer/ie-developer/compatibility/hh801214(v=vs.85)
|
2020-02-03 11:31:48 +00:00
|
|
|
if (!display_hidden && false)
|
2020-02-02 12:03:06 +00:00
|
|
|
parsed.filter(new NodeFilter() {
|
|
|
|
private boolean remove = false;
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public FilterResult head(Node node, int depth) {
|
|
|
|
if (node instanceof Comment) {
|
|
|
|
String data = ((Comment) node).getData().trim();
|
|
|
|
if (data.startsWith("[if") && !data.endsWith("endif]")) {
|
|
|
|
remove = true;
|
|
|
|
return FilterResult.REMOVE;
|
|
|
|
} else if (remove && data.endsWith("endif]")) {
|
|
|
|
remove = false;
|
|
|
|
return FilterResult.REMOVE;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return (remove ? FilterResult.REMOVE : FilterResult.CONTINUE);
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public FilterResult tail(Node node, int depth) {
|
|
|
|
return FilterResult.CONTINUE;
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2019-05-13 09:03:15 +00:00
|
|
|
// <html xmlns:v="urn:schemas-microsoft-com:vml"
|
|
|
|
// xmlns:o="urn:schemas-microsoft-com:office:office"
|
|
|
|
// xmlns:w="urn:schemas-microsoft-com:office:word"
|
|
|
|
// xmlns:m="http://schemas.microsoft.com/office/2004/12/omml"
|
|
|
|
// xmlns="http://www.w3.org/TR/REC-html40">
|
|
|
|
|
|
|
|
// <o:p> </o:p></span>
|
|
|
|
|
|
|
|
// Default XHTML namespace: http://www.w3.org/1999/xhtml
|
|
|
|
|
|
|
|
String ns = null;
|
|
|
|
for (Element h : parsed.select("html"))
|
|
|
|
for (Attribute a : h.attributes()) {
|
2019-05-15 09:18:14 +00:00
|
|
|
String key = a.getKey();
|
|
|
|
String value = a.getValue();
|
|
|
|
if (value != null &&
|
|
|
|
key.startsWith("xmlns:") &&
|
|
|
|
value.startsWith("http://www.w3.org/")) {
|
|
|
|
ns = key.split(":")[1];
|
2019-05-13 09:03:15 +00:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2019-05-15 09:18:14 +00:00
|
|
|
for (Element e : parsed.select("*")) {
|
|
|
|
String tag = e.tagName();
|
|
|
|
if (tag.contains(":")) {
|
|
|
|
if (ns != null && tag.startsWith(ns)) {
|
2019-05-13 09:03:15 +00:00
|
|
|
e.tagName(tag.split(":")[1]);
|
|
|
|
Log.i("Updated tag=" + tag + " to=" + e.tagName());
|
|
|
|
} else {
|
|
|
|
e.remove();
|
|
|
|
Log.i("Removed tag=" + tag);
|
|
|
|
}
|
|
|
|
}
|
2019-05-15 09:18:14 +00:00
|
|
|
}
|
2019-05-13 09:03:15 +00:00
|
|
|
|
2020-02-14 08:04:16 +00:00
|
|
|
// Limit length
|
2020-03-25 19:25:06 +00:00
|
|
|
if (view && truncate(parsed, true)) {
|
2020-02-14 08:04:16 +00:00
|
|
|
parsed.body()
|
2020-02-16 09:56:27 +00:00
|
|
|
.appendElement("br")
|
2020-02-14 08:04:16 +00:00
|
|
|
.appendElement("p")
|
|
|
|
.appendElement("em")
|
|
|
|
.text(context.getString(R.string.title_too_large));
|
2020-03-25 19:25:06 +00:00
|
|
|
parsed.body()
|
|
|
|
.appendElement("p")
|
|
|
|
.appendElement("big")
|
|
|
|
.appendElement("a")
|
|
|
|
.attr("href", "full:")
|
|
|
|
.text(context.getString(R.string.title_show_full));
|
2020-02-14 08:04:16 +00:00
|
|
|
}
|
|
|
|
|
2020-04-20 13:01:05 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/style
|
2020-04-21 07:04:55 +00:00
|
|
|
List<CSSStyleSheet> sheets = new ArrayList<>();
|
2020-04-20 13:01:05 +00:00
|
|
|
for (Element style : parsed.head().select("style")) {
|
|
|
|
Log.i("Style=" + style.data());
|
|
|
|
try {
|
|
|
|
InputSource source = new InputSource(new StringReader(style.data()));
|
2020-04-21 07:04:55 +00:00
|
|
|
String media = style.attr("media");
|
|
|
|
if (!TextUtils.isEmpty(media))
|
|
|
|
source.setMedia(media);
|
|
|
|
|
2020-04-20 13:01:05 +00:00
|
|
|
CSSOMParser parser = new CSSOMParser(new SACParserCSS3());
|
|
|
|
parser.setErrorHandler(new ErrorHandler() {
|
|
|
|
@Override
|
|
|
|
public void warning(CSSParseException ex) throws CSSException {
|
|
|
|
Log.w(ex);
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public void error(CSSParseException ex) throws CSSException {
|
|
|
|
Log.e(ex);
|
|
|
|
}
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public void fatalError(CSSParseException ex) throws CSSException {
|
|
|
|
Log.e(ex);
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2020-04-21 07:04:55 +00:00
|
|
|
sheets.add(parser.parseStyleSheet(source, null, null));
|
2020-04-20 13:01:05 +00:00
|
|
|
} catch (Throwable ex) {
|
|
|
|
Log.w(ex);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-03-12 09:04:16 +00:00
|
|
|
Whitelist whitelist = Whitelist.relaxed()
|
2020-02-08 19:57:37 +00:00
|
|
|
.addTags("hr", "abbr", "big", "font", "dfn", "del", "s", "tt")
|
2020-04-20 13:01:05 +00:00
|
|
|
.addAttributes(":all", "class")
|
2020-02-20 15:08:33 +00:00
|
|
|
.addAttributes(":all", "style")
|
2020-04-20 07:57:42 +00:00
|
|
|
.addAttributes("font", "size")
|
2019-03-10 15:21:46 +00:00
|
|
|
.removeTags("col", "colgroup", "thead", "tbody")
|
2019-03-12 09:04:16 +00:00
|
|
|
.removeAttributes("table", "width")
|
|
|
|
.removeAttributes("td", "colspan", "rowspan", "width")
|
|
|
|
.removeAttributes("th", "colspan", "rowspan", "width")
|
2018-12-14 09:05:48 +00:00
|
|
|
.addProtocols("img", "src", "cid")
|
2020-02-14 08:04:16 +00:00
|
|
|
.addProtocols("img", "src", "data")
|
|
|
|
.addProtocols("a", "href", "full");
|
2019-09-23 18:13:38 +00:00
|
|
|
if (text_color)
|
2019-09-25 10:48:02 +00:00
|
|
|
whitelist
|
|
|
|
.addAttributes("font", "color");
|
2019-09-23 18:13:38 +00:00
|
|
|
|
2019-03-12 09:04:16 +00:00
|
|
|
final Document document = new Cleaner(whitelist).clean(parsed);
|
2018-11-24 11:27:44 +00:00
|
|
|
|
2019-09-24 12:46:12 +00:00
|
|
|
boolean dark = Helper.isDarkTheme(context);
|
|
|
|
|
2019-09-25 10:48:02 +00:00
|
|
|
// Font
|
|
|
|
for (Element font : document.select("font")) {
|
2020-04-20 07:57:42 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/font
|
2019-09-25 10:48:02 +00:00
|
|
|
String color = font.attr("color");
|
2020-04-20 07:57:42 +00:00
|
|
|
String size = font.attr("size");
|
|
|
|
|
2019-09-25 13:20:27 +00:00
|
|
|
if (Build.VERSION.SDK_INT >= Build.VERSION_CODES.N)
|
|
|
|
font.removeAttr("color");
|
2020-04-20 07:57:42 +00:00
|
|
|
font.removeAttr("size");
|
|
|
|
|
|
|
|
StringBuilder sb = new StringBuilder();
|
|
|
|
|
|
|
|
if (!TextUtils.isEmpty(color))
|
|
|
|
sb.append("color:").append(color).append(";");
|
|
|
|
|
|
|
|
if (!TextUtils.isEmpty(size)) {
|
|
|
|
try {
|
|
|
|
int s = Integer.parseInt(size);
|
|
|
|
if (s < 3)
|
|
|
|
size = "small";
|
|
|
|
else if (s > 3)
|
|
|
|
size = "large";
|
|
|
|
else
|
|
|
|
size = "medium";
|
|
|
|
sb.append("font-size:").append(size).append(";");
|
|
|
|
} catch (NumberFormatException ex) {
|
|
|
|
Log.w(ex);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
font.attr("style", sb.toString());
|
|
|
|
|
2019-09-25 10:48:02 +00:00
|
|
|
font.tagName("span");
|
|
|
|
}
|
|
|
|
|
2019-10-16 09:05:38 +00:00
|
|
|
// Sanitize styles
|
|
|
|
for (Element element : document.select("*")) {
|
2020-04-20 13:01:05 +00:00
|
|
|
String clazz = element.attr("class");
|
2020-04-21 18:29:58 +00:00
|
|
|
|
|
|
|
// This is to workaround a TextView bug
|
|
|
|
List<Element> parents = element.parents();
|
|
|
|
Collections.reverse(parents);
|
|
|
|
String style = null;
|
|
|
|
for (Element parent : parents)
|
|
|
|
style = mergeStyles(style, parent.attr("style"), "color");
|
|
|
|
|
|
|
|
style = mergeStyles(style, element.attr("style"));
|
2020-04-20 13:01:05 +00:00
|
|
|
|
|
|
|
// Process class
|
2020-04-21 07:04:55 +00:00
|
|
|
if (!TextUtils.isEmpty(clazz))
|
|
|
|
style = processClass(clazz, style, sheets);
|
2020-04-20 13:01:05 +00:00
|
|
|
|
|
|
|
// Process style
|
2019-09-23 17:51:17 +00:00
|
|
|
if (!TextUtils.isEmpty(style)) {
|
|
|
|
StringBuilder sb = new StringBuilder();
|
|
|
|
|
|
|
|
String[] params = style.split(";");
|
|
|
|
for (String param : params) {
|
2020-04-20 13:01:05 +00:00
|
|
|
int colon = param.indexOf(':');
|
|
|
|
if (colon > 0) {
|
|
|
|
String key = param.substring(0, colon).trim().toLowerCase(Locale.ROOT);
|
|
|
|
String value = param.substring(colon + 1).toLowerCase(Locale.ROOT)
|
2020-02-02 10:11:44 +00:00
|
|
|
.replace("!important", "")
|
2020-02-02 12:01:46 +00:00
|
|
|
.trim()
|
2020-02-02 10:11:44 +00:00
|
|
|
.replaceAll("\\s+", " ");
|
2019-10-16 09:05:38 +00:00
|
|
|
switch (key) {
|
2019-09-23 17:51:17 +00:00
|
|
|
case "color":
|
2020-02-09 09:31:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/color
|
2020-02-20 15:08:33 +00:00
|
|
|
if (!text_color)
|
|
|
|
continue;
|
|
|
|
|
2020-01-31 12:52:57 +00:00
|
|
|
Integer color = parseColor(value, dark);
|
|
|
|
if (color != null) {
|
2020-02-08 17:45:28 +00:00
|
|
|
// fromHtml does not support transparency
|
2020-02-15 18:22:28 +00:00
|
|
|
String c = String.format("#%06x", color);
|
2019-09-24 12:46:12 +00:00
|
|
|
sb.append("color:").append(c).append(";");
|
2019-09-25 13:20:27 +00:00
|
|
|
if (Build.VERSION.SDK_INT < Build.VERSION_CODES.N)
|
2019-10-16 09:05:38 +00:00
|
|
|
element.attr("color", c);
|
2019-09-24 12:46:12 +00:00
|
|
|
}
|
2020-02-20 15:08:33 +00:00
|
|
|
|
2019-09-23 17:51:17 +00:00
|
|
|
break;
|
2019-09-23 20:07:22 +00:00
|
|
|
|
2020-02-09 09:31:37 +00:00
|
|
|
case "font-size":
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/font-size
|
2020-02-20 15:08:33 +00:00
|
|
|
if (!text_size)
|
|
|
|
continue;
|
|
|
|
|
2020-02-20 10:28:55 +00:00
|
|
|
Element parent = element.parent();
|
|
|
|
if (parent != null) {
|
2020-02-20 10:30:43 +00:00
|
|
|
boolean set = false;
|
|
|
|
boolean small = false;
|
|
|
|
boolean big = false;
|
2020-02-20 10:28:55 +00:00
|
|
|
Integer current = null;
|
|
|
|
while (parent != null) {
|
2020-02-20 10:30:43 +00:00
|
|
|
if (!set) {
|
|
|
|
if ("small".equals(parent.tagName())) {
|
|
|
|
set = true;
|
|
|
|
small = true;
|
|
|
|
}
|
|
|
|
if ("big".equals(parent.tagName())) {
|
|
|
|
set = true;
|
|
|
|
big = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-20 10:28:55 +00:00
|
|
|
String xFontSize = parent.attr("x-font-size");
|
|
|
|
if (!TextUtils.isEmpty(xFontSize)) {
|
|
|
|
current = Integer.parseInt(xFontSize);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
parent = parent.parent();
|
|
|
|
}
|
|
|
|
|
|
|
|
Float fsize = getFontSize(value, current);
|
2020-02-10 08:29:47 +00:00
|
|
|
if (fsize != null && fsize != 0 &&
|
2020-04-20 07:57:42 +00:00
|
|
|
((!small && fsize <= FONT_SMALL) || (!big && fsize >= FONT_LARGE))) {
|
2020-02-10 08:29:47 +00:00
|
|
|
Element e = new Element(fsize < 1 ? "small" : "big");
|
2020-02-20 10:37:40 +00:00
|
|
|
int px = Math.round(DEFAULT_FONT_SIZE * fsize);
|
|
|
|
e.attr("x-font-size", Integer.toString(px));
|
2020-02-10 08:29:47 +00:00
|
|
|
element.replaceWith(e);
|
|
|
|
e.appendChild(element);
|
|
|
|
}
|
2020-02-09 09:31:37 +00:00
|
|
|
}
|
2020-02-20 15:08:33 +00:00
|
|
|
|
2020-02-09 09:31:37 +00:00
|
|
|
break;
|
|
|
|
|
2020-02-08 19:39:51 +00:00
|
|
|
case "font-weight":
|
2020-02-09 09:31:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/font-weight
|
2020-02-10 08:29:47 +00:00
|
|
|
if (element.parent() != null) {
|
|
|
|
Integer fweight = getFontWeight(value);
|
|
|
|
if (fweight != null && fweight >= 600) {
|
|
|
|
Element strong = new Element("strong");
|
|
|
|
element.replaceWith(strong);
|
|
|
|
strong.appendChild(element);
|
|
|
|
}
|
2020-02-08 19:39:51 +00:00
|
|
|
}
|
2019-09-23 20:07:22 +00:00
|
|
|
break;
|
2019-09-24 12:46:12 +00:00
|
|
|
|
2020-02-09 09:31:37 +00:00
|
|
|
case "text-decoration":
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/text-decoration
|
|
|
|
if (value.contains("line-through"))
|
|
|
|
sb.append("text-decoration:line-through;");
|
2019-09-24 12:46:12 +00:00
|
|
|
break;
|
2019-10-16 09:05:38 +00:00
|
|
|
|
|
|
|
case "display":
|
2020-02-09 09:31:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/display
|
2020-02-10 18:55:52 +00:00
|
|
|
if (element.parent() != null &&
|
|
|
|
!display_hidden && "none".equals(value)) {
|
|
|
|
Log.i("Removing display none " + element.tagName());
|
|
|
|
element.remove();
|
2019-10-16 09:05:38 +00:00
|
|
|
}
|
2020-02-05 09:31:20 +00:00
|
|
|
if ("inline".equals(value) || "inline-block".equals(value)) {
|
|
|
|
if (element.nextSibling() != null)
|
|
|
|
element.attr("inline", "true");
|
|
|
|
}
|
2019-10-16 09:05:38 +00:00
|
|
|
break;
|
2019-11-26 08:15:33 +00:00
|
|
|
|
|
|
|
case "height":
|
|
|
|
case "width":
|
|
|
|
//case "font-size":
|
|
|
|
//case "line-height":
|
2020-02-10 18:55:52 +00:00
|
|
|
if (element.parent() != null && !display_hidden) {
|
2020-02-20 10:28:55 +00:00
|
|
|
Float s = getFontSize(value, null);
|
2020-02-09 09:31:37 +00:00
|
|
|
if (s != null && s == 0) {
|
2020-02-10 18:55:52 +00:00
|
|
|
Log.i("Removing no height/width " + element.tagName());
|
|
|
|
element.remove();
|
2020-02-09 09:31:37 +00:00
|
|
|
}
|
2019-11-26 08:15:33 +00:00
|
|
|
}
|
|
|
|
break;
|
2020-04-13 17:31:02 +00:00
|
|
|
|
2020-04-21 10:27:32 +00:00
|
|
|
case "margin":
|
|
|
|
case "padding":
|
|
|
|
case "margin-top":
|
|
|
|
case "margin-bottom":
|
2020-04-13 17:31:02 +00:00
|
|
|
case "padding-top":
|
|
|
|
case "padding-bottom":
|
2020-04-21 10:27:32 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/margin
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/padding
|
2020-04-14 08:26:39 +00:00
|
|
|
if (element.isBlock() && hasVisibleContent(element.childNodes())) {
|
2020-04-21 10:27:32 +00:00
|
|
|
Float[] p = new Float[4];
|
|
|
|
|
|
|
|
String[] v = value.split(" ");
|
|
|
|
for (int i = 0; i < v.length; i++)
|
|
|
|
p[i] = getFontSize(v[i], null);
|
|
|
|
|
|
|
|
if (v.length == 1) {
|
|
|
|
p[1] = p[0];
|
|
|
|
p[2] = p[0];
|
|
|
|
p[3] = p[0];
|
|
|
|
} else if (v.length == 2) {
|
|
|
|
p[2] = p[0];
|
|
|
|
p[3] = p[1];
|
|
|
|
}
|
|
|
|
|
|
|
|
if (key.endsWith("top"))
|
|
|
|
p[2] = null;
|
|
|
|
else if (key.endsWith("bottom"))
|
|
|
|
p[0] = null;
|
|
|
|
|
2020-04-21 17:44:35 +00:00
|
|
|
if (p[0] != null && p[0] > 0.5)
|
2020-04-21 10:27:32 +00:00
|
|
|
element.attr("line-before", "true");
|
2020-04-21 17:44:35 +00:00
|
|
|
if (p[2] != null && p[2] > 0.5)
|
2020-04-21 10:27:32 +00:00
|
|
|
element.attr("line-after", "true");
|
2020-04-13 17:31:02 +00:00
|
|
|
}
|
|
|
|
break;
|
2019-09-23 17:51:17 +00:00
|
|
|
}
|
2019-10-16 09:05:38 +00:00
|
|
|
}
|
2019-09-23 17:51:17 +00:00
|
|
|
}
|
|
|
|
|
2019-09-25 16:05:13 +00:00
|
|
|
if (sb.length() == 0)
|
2019-10-16 09:05:38 +00:00
|
|
|
element.removeAttr("style");
|
2020-01-31 12:52:57 +00:00
|
|
|
else {
|
2019-10-16 09:05:38 +00:00
|
|
|
element.attr("style", sb.toString());
|
2020-01-31 12:52:57 +00:00
|
|
|
if (BuildConfig.DEBUG)
|
|
|
|
Log.i("Style=" + sb);
|
|
|
|
}
|
2019-09-23 17:51:17 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-24 19:34:16 +00:00
|
|
|
// Remove trailing br from div
|
2020-01-20 17:02:40 +00:00
|
|
|
for (Element div : document.select("div"))
|
|
|
|
if (div.children().select("div").size() == 0 &&
|
|
|
|
hasVisibleContent(div.childNodes())) {
|
|
|
|
Node last = div.childNode(div.childNodeSize() - 1);
|
|
|
|
if (last != null && "br".equals(last.nodeName()))
|
|
|
|
last.remove();
|
|
|
|
}
|
|
|
|
|
2020-02-24 19:34:16 +00:00
|
|
|
// Replace headings
|
2020-02-20 15:08:33 +00:00
|
|
|
if (!text_size)
|
|
|
|
for (Element h : document.select("h1,h2,h3,h4,h5,h6")) {
|
|
|
|
h.appendElement("br");
|
|
|
|
h.appendElement("br");
|
|
|
|
h.tagName("strong");
|
|
|
|
}
|
|
|
|
|
2019-09-12 08:45:54 +00:00
|
|
|
// Paragraphs
|
2019-11-11 10:32:47 +00:00
|
|
|
for (Element p : document.select("p")) {
|
|
|
|
p.appendElement("br");
|
2019-09-12 08:45:54 +00:00
|
|
|
p.tagName("div");
|
2019-11-11 10:32:47 +00:00
|
|
|
}
|
2019-09-12 08:45:54 +00:00
|
|
|
|
2020-02-08 19:57:37 +00:00
|
|
|
// Short inline quotes
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/q
|
2019-03-10 15:21:46 +00:00
|
|
|
for (Element q : document.select("q")) {
|
2020-02-08 19:57:37 +00:00
|
|
|
q.tagName("a");
|
|
|
|
q.attr("href", q.attr("cite"));
|
|
|
|
q.removeAttr("cite");
|
2019-03-10 15:21:46 +00:00
|
|
|
}
|
|
|
|
|
2020-02-08 19:57:37 +00:00
|
|
|
// Citation
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/cite
|
|
|
|
for (Element cite : document.select("cite")) {
|
|
|
|
cite.prependText("\"");
|
|
|
|
cite.appendText("\"");
|
|
|
|
cite.tagName("em");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Definition
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/dfn
|
|
|
|
for (Element dfn : document.select("dfn"))
|
|
|
|
dfn.tagName("em");
|
|
|
|
|
2019-03-10 15:21:46 +00:00
|
|
|
// Pre formatted text
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/pre
|
2019-09-01 09:10:00 +00:00
|
|
|
for (Element pre : document.select("pre")) {
|
2019-11-19 08:57:55 +00:00
|
|
|
pre.html(formatPre(pre.wholeText()));
|
2020-02-06 09:46:17 +00:00
|
|
|
pre.tagName("div");
|
2019-03-10 15:21:46 +00:00
|
|
|
}
|
2019-03-10 11:14:39 +00:00
|
|
|
|
2019-03-10 15:21:46 +00:00
|
|
|
// Code
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/code
|
2019-09-21 16:10:41 +00:00
|
|
|
document.select("code").tagName("strong");
|
2019-03-10 15:21:46 +00:00
|
|
|
|
|
|
|
// Lines
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/hr
|
2019-03-10 15:21:46 +00:00
|
|
|
for (Element hr : document.select("hr")) {
|
|
|
|
hr.tagName("div");
|
2019-03-18 18:23:43 +00:00
|
|
|
hr.text("----------------------------------------");
|
2019-02-10 12:01:21 +00:00
|
|
|
}
|
|
|
|
|
2019-03-10 15:21:46 +00:00
|
|
|
// Descriptions
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/dl
|
2019-03-10 15:21:46 +00:00
|
|
|
document.select("dl").tagName("div");
|
2019-03-11 08:27:56 +00:00
|
|
|
for (Element dt : document.select("dt")) {
|
|
|
|
dt.tagName("strong");
|
2019-03-10 15:21:46 +00:00
|
|
|
dt.appendElement("br");
|
2019-03-11 08:27:56 +00:00
|
|
|
}
|
|
|
|
for (Element dd : document.select("dd")) {
|
|
|
|
dd.tagName("em");
|
|
|
|
dd.appendElement("br").appendElement("br");
|
|
|
|
}
|
2018-11-24 11:27:44 +00:00
|
|
|
|
2019-03-12 12:13:53 +00:00
|
|
|
// Abbreviations
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/abbr
|
2019-03-12 12:13:53 +00:00
|
|
|
document.select("abbr").tagName("u");
|
|
|
|
|
2019-06-30 07:41:18 +00:00
|
|
|
// Subscript/Superscript
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/sub
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/sup
|
2019-06-30 07:41:18 +00:00
|
|
|
for (Element subp : document.select("sub,sup")) {
|
|
|
|
Element small = document.createElement("small");
|
|
|
|
small.html(subp.html());
|
|
|
|
subp.html(small.outerHtml());
|
|
|
|
}
|
|
|
|
|
|
|
|
// Lists
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/li
|
2019-06-30 07:41:18 +00:00
|
|
|
for (Element li : document.select("li")) {
|
|
|
|
li.tagName("span");
|
2020-01-30 10:12:26 +00:00
|
|
|
Element parent = li.parent();
|
|
|
|
if (parent == null || "ul".equals(parent.tagName()))
|
|
|
|
li.prependText("• ");
|
|
|
|
else
|
|
|
|
li.prependText((li.elementSiblingIndex() + 1) + ". ");
|
2019-06-30 07:41:18 +00:00
|
|
|
li.appendElement("br"); // line break after list item
|
|
|
|
}
|
|
|
|
document.select("ol").tagName("div");
|
|
|
|
document.select("ul").tagName("div");
|
2018-12-21 14:19:07 +00:00
|
|
|
|
2019-03-30 16:48:04 +00:00
|
|
|
// Tables
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/table
|
2019-03-30 16:48:04 +00:00
|
|
|
for (Element col : document.select("th,td")) {
|
2019-09-02 17:01:17 +00:00
|
|
|
// separate columns
|
2019-09-12 16:53:57 +00:00
|
|
|
if (hasVisibleContent(col.childNodes()))
|
2019-09-12 08:45:54 +00:00
|
|
|
if (col.nextElementSibling() != null)
|
2019-09-02 17:01:17 +00:00
|
|
|
col.appendText(" ");
|
2019-03-30 16:48:04 +00:00
|
|
|
|
|
|
|
if ("th".equals(col.tagName()))
|
|
|
|
col.tagName("strong");
|
|
|
|
else
|
|
|
|
col.tagName("span");
|
|
|
|
}
|
|
|
|
|
2019-09-12 08:45:54 +00:00
|
|
|
for (Element row : document.select("tr")) {
|
2019-03-30 16:48:04 +00:00
|
|
|
row.tagName("span");
|
2019-09-12 16:53:57 +00:00
|
|
|
if (hasVisibleContent(row.childNodes())) {
|
2019-09-12 13:28:21 +00:00
|
|
|
Element next = row.nextElementSibling();
|
|
|
|
if (next != null && "tr".equals(next.tagName()))
|
|
|
|
row.appendElement("br");
|
|
|
|
}
|
2019-09-12 08:45:54 +00:00
|
|
|
}
|
2019-03-30 16:48:04 +00:00
|
|
|
|
2019-09-11 20:52:15 +00:00
|
|
|
document.select("caption").tagName("div");
|
2019-06-18 19:56:34 +00:00
|
|
|
|
|
|
|
for (Element table : document.select("table"))
|
|
|
|
if (table.parent() != null && "a".equals(table.parent().tagName()))
|
2019-06-30 07:51:43 +00:00
|
|
|
table.tagName("span"); // Links cannot contain tables
|
2019-06-18 19:56:34 +00:00
|
|
|
else
|
|
|
|
table.tagName("div");
|
2019-03-30 16:48:04 +00:00
|
|
|
|
2019-10-04 13:25:04 +00:00
|
|
|
// Remove tracking pixels
|
2019-09-13 11:46:52 +00:00
|
|
|
if (disable_tracking)
|
2019-10-04 13:25:04 +00:00
|
|
|
removeTrackingPixels(context, document);
|
2019-09-13 11:46:52 +00:00
|
|
|
|
|
|
|
// Images
|
2020-02-08 19:57:37 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/HTML/Element/img
|
2019-06-30 07:59:03 +00:00
|
|
|
for (Element img : document.select("img")) {
|
2019-10-14 06:50:27 +00:00
|
|
|
String alt = img.attr("alt");
|
|
|
|
String src = img.attr("src");
|
|
|
|
String tracking = img.attr("tracking");
|
|
|
|
|
2019-10-19 08:19:05 +00:00
|
|
|
if (!show_images && !TextUtils.isEmpty(alt))
|
|
|
|
if (TextUtils.isEmpty(tracking))
|
2020-02-10 07:41:55 +00:00
|
|
|
img.appendText("[" + alt + "]");
|
2019-10-19 08:19:05 +00:00
|
|
|
else {
|
2019-10-05 07:38:36 +00:00
|
|
|
img.append(" ");
|
2019-10-19 08:19:05 +00:00
|
|
|
Element a = document.createElement("a");
|
|
|
|
a.attr("href", tracking);
|
|
|
|
a.text(alt);
|
|
|
|
img.appendChild(a);
|
|
|
|
img.appendText(" ");
|
2019-06-30 07:41:18 +00:00
|
|
|
}
|
2019-07-26 18:45:53 +00:00
|
|
|
|
|
|
|
// Annotate source with width and height
|
2019-10-14 06:50:27 +00:00
|
|
|
if (!TextUtils.isEmpty(src)) {
|
2019-07-26 19:33:32 +00:00
|
|
|
int width = 0;
|
|
|
|
int height = 0;
|
2019-07-26 18:45:53 +00:00
|
|
|
|
2019-07-27 05:32:26 +00:00
|
|
|
String awidth = img.attr("width");
|
|
|
|
for (int i = 0; i < awidth.length(); i++)
|
|
|
|
if (Character.isDigit(awidth.charAt(i)))
|
|
|
|
width = width * 10 + (byte) awidth.charAt(i) - (byte) '0';
|
|
|
|
else
|
|
|
|
break;
|
|
|
|
|
|
|
|
String aheight = img.attr("height");
|
|
|
|
for (int i = 0; i < aheight.length(); i++)
|
|
|
|
if (Character.isDigit(aheight.charAt(i)))
|
|
|
|
height = height * 10 + (byte) aheight.charAt(i) - (byte) '0';
|
|
|
|
else
|
|
|
|
break;
|
2019-07-26 19:33:32 +00:00
|
|
|
|
|
|
|
if (width != 0 || height != 0) {
|
2019-10-05 09:57:54 +00:00
|
|
|
ImageHelper.AnnotatedSource a = new ImageHelper.AnnotatedSource(
|
2019-10-14 06:50:27 +00:00
|
|
|
src, width, height, !TextUtils.isEmpty(tracking));
|
2019-07-26 19:33:32 +00:00
|
|
|
img.attr("src", a.getAnnotated());
|
|
|
|
}
|
2019-07-26 18:45:53 +00:00
|
|
|
}
|
2019-06-30 07:59:03 +00:00
|
|
|
}
|
2019-03-30 16:48:04 +00:00
|
|
|
|
2019-06-30 07:41:18 +00:00
|
|
|
// Autolink
|
2020-03-25 19:25:06 +00:00
|
|
|
if (view) {
|
2019-11-15 07:43:35 +00:00
|
|
|
final Pattern pattern = Pattern.compile(
|
|
|
|
PatternsCompat.AUTOLINK_EMAIL_ADDRESS.pattern() + "|" +
|
|
|
|
PatternsCompat.AUTOLINK_WEB_URL.pattern());
|
|
|
|
|
|
|
|
NodeTraversor.traverse(new NodeVisitor() {
|
|
|
|
private int links = 0;
|
|
|
|
|
|
|
|
@Override
|
|
|
|
public void head(Node node, int depth) {
|
|
|
|
if (links < MAX_AUTO_LINK && node instanceof TextNode) {
|
|
|
|
TextNode tnode = (TextNode) node;
|
|
|
|
String text = tnode.getWholeText();
|
|
|
|
|
|
|
|
Matcher matcher = pattern.matcher(text);
|
|
|
|
if (matcher.find()) {
|
|
|
|
Element span = document.createElement("span");
|
|
|
|
|
|
|
|
int pos = 0;
|
|
|
|
do {
|
|
|
|
boolean linked = false;
|
|
|
|
Node parent = tnode.parent();
|
|
|
|
while (parent != null) {
|
|
|
|
if ("a".equals(parent.nodeName())) {
|
|
|
|
linked = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
parent = parent.parent();
|
2019-03-12 09:04:16 +00:00
|
|
|
}
|
2019-02-19 07:29:03 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
boolean email = matcher.group().contains("@") && !matcher.group().contains(":");
|
2019-12-07 16:02:42 +00:00
|
|
|
Log.d("Web url=" + matcher.group() +
|
|
|
|
" " + matcher.start() + "..." + matcher.end() + "/" + text.length() +
|
|
|
|
" linked=" + linked + " email=" + email + " count=" + links);
|
2019-02-19 07:29:03 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
if (linked)
|
|
|
|
span.appendText(text.substring(pos, matcher.end()));
|
|
|
|
else {
|
|
|
|
span.appendText(text.substring(pos, matcher.start()));
|
2019-02-19 07:29:03 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
Element a = document.createElement("a");
|
|
|
|
a.attr("href", (email ? "mailto:" : "") + matcher.group());
|
|
|
|
a.text(matcher.group());
|
|
|
|
span.appendChild(a);
|
2019-08-20 18:05:11 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
links++;
|
|
|
|
}
|
2019-02-19 07:29:03 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
pos = matcher.end();
|
|
|
|
} while (links < MAX_AUTO_LINK && matcher.find());
|
2019-06-13 08:20:45 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
span.appendText(text.substring(pos));
|
2019-02-16 21:55:44 +00:00
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
tnode.before(span);
|
|
|
|
tnode.text("");
|
|
|
|
}
|
2018-09-02 11:18:32 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-11-15 07:43:35 +00:00
|
|
|
@Override
|
|
|
|
public void tail(Node node, int depth) {
|
|
|
|
}
|
|
|
|
}, document);
|
|
|
|
}
|
2019-03-12 09:04:16 +00:00
|
|
|
|
2020-02-06 13:24:15 +00:00
|
|
|
for (Element div : document.select("div")) {
|
|
|
|
boolean inline = Boolean.parseBoolean(div.attr("inline"));
|
|
|
|
if (inline)
|
|
|
|
div.tagName("span");
|
|
|
|
}
|
|
|
|
|
2019-09-12 08:45:54 +00:00
|
|
|
// Selective new lines
|
2020-02-06 09:35:35 +00:00
|
|
|
for (Element div : document.select("div")) {
|
2020-02-06 09:45:52 +00:00
|
|
|
Node prev = div.previousSibling();
|
2020-02-06 16:06:09 +00:00
|
|
|
if (prev != null && hasVisibleContent(Arrays.asList(prev)))
|
2020-02-06 09:45:52 +00:00
|
|
|
div.prependElement("br");
|
|
|
|
|
2020-02-06 15:59:05 +00:00
|
|
|
if (hasVisibleContent(div.childNodes()))
|
2019-09-11 17:52:04 +00:00
|
|
|
div.appendElement("br");
|
2020-02-06 09:35:35 +00:00
|
|
|
}
|
2019-09-12 08:45:54 +00:00
|
|
|
|
|
|
|
for (Element div : document.select("div"))
|
|
|
|
div.tagName("span");
|
2019-07-08 18:14:33 +00:00
|
|
|
|
2020-04-21 10:27:32 +00:00
|
|
|
for (Element e : document.select("*[line-before],*[line-after]")) {
|
2020-04-21 17:44:35 +00:00
|
|
|
if (!TextUtils.isEmpty(e.attr("line-before"))) {
|
|
|
|
Element prev = e.previousElementSibling();
|
|
|
|
if (prev == null || !"br".equals(prev.tagName()))
|
|
|
|
e.prependElement("br");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!TextUtils.isEmpty(e.attr("line-after"))) {
|
|
|
|
Element next = e.nextElementSibling();
|
|
|
|
if (next == null || !"br".equals(next.tagName()))
|
|
|
|
e.appendElement("br");
|
|
|
|
}
|
2020-04-21 10:27:32 +00:00
|
|
|
}
|
2020-04-13 17:31:02 +00:00
|
|
|
|
2019-09-25 13:20:27 +00:00
|
|
|
if (Build.VERSION.SDK_INT < Build.VERSION_CODES.N)
|
|
|
|
for (Element span : document.select("span"))
|
|
|
|
if (!TextUtils.isEmpty(span.attr("color")))
|
|
|
|
span.tagName("font");
|
|
|
|
|
2019-11-22 18:16:02 +00:00
|
|
|
if (document.body() == null) {
|
|
|
|
Log.e("Sanitize without body");
|
|
|
|
document.normalise();
|
|
|
|
}
|
|
|
|
|
2019-11-19 20:53:12 +00:00
|
|
|
return document;
|
2018-08-02 13:33:06 +00:00
|
|
|
}
|
2018-12-14 09:11:45 +00:00
|
|
|
|
2020-04-21 07:04:55 +00:00
|
|
|
private static String processClass(String clazz, String style, List<CSSStyleSheet> sheets) {
|
|
|
|
for (CSSStyleSheet sheet : sheets)
|
|
|
|
if (isScreenMedia(sheet.getMedia()))
|
|
|
|
style = processClass(clazz, style, sheet.getCssRules());
|
|
|
|
return style;
|
|
|
|
}
|
|
|
|
|
|
|
|
private static String processClass(String clazz, String style, CSSRuleList rules) {
|
|
|
|
for (int i = 0; rules != null && i < rules.getLength(); i++) {
|
|
|
|
CSSRule rule = rules.item(i);
|
|
|
|
switch (rule.getType()) {
|
|
|
|
case CSSRule.STYLE_RULE:
|
|
|
|
CSSStyleRuleImpl srule = (CSSStyleRuleImpl) rule;
|
|
|
|
for (int j = 0; j < srule.getSelectors().getLength(); j++) {
|
|
|
|
Selector selector = srule.getSelectors().item(j);
|
|
|
|
switch (selector.getSelectorType()) {
|
|
|
|
case Selector.SAC_CONDITIONAL_SELECTOR:
|
|
|
|
ConditionalSelectorImpl cselector = (ConditionalSelectorImpl) selector;
|
|
|
|
if (cselector.getCondition().getConditionType() == SAC_CLASS_CONDITION) {
|
|
|
|
ClassConditionImpl ccondition = (ClassConditionImpl) cselector.getCondition();
|
|
|
|
if (clazz.equals(ccondition.getValue()))
|
|
|
|
style = mergeStyles(srule.getStyle().getCssText(), style);
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case CSSRule.MEDIA_RULE:
|
|
|
|
CSSMediaRuleImpl mrule = (CSSMediaRuleImpl) rule;
|
|
|
|
if (isScreenMedia(mrule.getMedia()))
|
|
|
|
style = processClass(clazz, style, mrule.getCssRules());
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return style;
|
|
|
|
}
|
|
|
|
|
|
|
|
private static boolean isScreenMedia(MediaList media) {
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/Media_Queries/Using_media_queries
|
2020-04-21 09:41:52 +00:00
|
|
|
// https://developers.google.com/gmail/design/reference/supported_css#supported_types
|
2020-04-21 07:04:55 +00:00
|
|
|
if (media instanceof MediaListImpl) {
|
|
|
|
MediaListImpl _media = (MediaListImpl) media;
|
|
|
|
for (int i = 0; i < _media.getLength(); i++) {
|
|
|
|
String query = _media.mediaQuery(i).getCssText(null);
|
|
|
|
if ("all".equals(query) ||
|
|
|
|
"screen".equals(query) || "only screen".equals(query))
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
} else
|
|
|
|
Log.e("Media class=" + media.getClass().getName());
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2020-04-20 13:01:05 +00:00
|
|
|
private static String mergeStyles(String base, String style) {
|
2020-04-21 18:29:58 +00:00
|
|
|
return mergeStyles(base, style, null);
|
|
|
|
}
|
|
|
|
|
|
|
|
private static String mergeStyles(String base, String style, String selector) {
|
2020-04-20 13:01:05 +00:00
|
|
|
Map<String, String> result = new HashMap<>();
|
|
|
|
|
|
|
|
List<String> params = new ArrayList<>();
|
|
|
|
if (!TextUtils.isEmpty(base))
|
|
|
|
params.addAll(Arrays.asList(base.split(";")));
|
|
|
|
if (!TextUtils.isEmpty(style))
|
|
|
|
params.addAll(Arrays.asList(style.split(";")));
|
|
|
|
|
|
|
|
for (String param : params) {
|
|
|
|
int colon = param.indexOf(':');
|
|
|
|
if (colon > 0) {
|
|
|
|
String key = param.substring(0, colon).trim().toLowerCase(Locale.ROOT);
|
2020-04-21 18:29:58 +00:00
|
|
|
if (selector == null || selector.equals(key))
|
|
|
|
result.put(key, param);
|
2020-04-20 13:01:05 +00:00
|
|
|
} else
|
|
|
|
Log.w("Invalid style param=" + param);
|
|
|
|
}
|
|
|
|
|
|
|
|
return TextUtils.join(";", result.values());
|
|
|
|
}
|
|
|
|
|
2020-02-09 09:31:37 +00:00
|
|
|
private static Integer getFontWeight(String value) {
|
|
|
|
if (TextUtils.isEmpty(value))
|
|
|
|
return null;
|
|
|
|
|
|
|
|
value = value.toLowerCase(Locale.ROOT).trim();
|
|
|
|
|
|
|
|
switch (value) {
|
|
|
|
case "lighter":
|
|
|
|
return 300;
|
|
|
|
case "normal":
|
|
|
|
return 400;
|
|
|
|
case "bolder":
|
|
|
|
return 600;
|
|
|
|
case "bold":
|
|
|
|
return 700;
|
|
|
|
}
|
|
|
|
|
|
|
|
try {
|
|
|
|
return Integer.parseInt(value);
|
|
|
|
} catch (NumberFormatException ignored) {
|
|
|
|
}
|
|
|
|
|
|
|
|
return null;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2020-02-20 10:28:55 +00:00
|
|
|
private static Float getFontSize(String value, Integer current) {
|
2020-04-22 08:50:58 +00:00
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/font-size
|
2020-02-09 09:31:37 +00:00
|
|
|
if (TextUtils.isEmpty(value))
|
|
|
|
return null;
|
|
|
|
|
2020-04-22 08:50:58 +00:00
|
|
|
if (value.contains("calc") ||
|
|
|
|
"auto".equals(value) ||
|
|
|
|
"inherit".equals(value))
|
|
|
|
return null;
|
|
|
|
|
2020-04-20 07:57:42 +00:00
|
|
|
float _current = (current == null ? 1.0f : current / (float) DEFAULT_FONT_SIZE);
|
|
|
|
|
|
|
|
// Absolute
|
|
|
|
switch (value) {
|
|
|
|
case "xx-small":
|
|
|
|
case "x-small":
|
|
|
|
case "small":
|
|
|
|
return FONT_SMALL;
|
|
|
|
case "medium":
|
|
|
|
return 1.0f;
|
|
|
|
case "large":
|
|
|
|
case "x-large":
|
|
|
|
case "xx-large":
|
|
|
|
case "xxx-large":
|
|
|
|
return FONT_LARGE;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Relative
|
|
|
|
switch (value) {
|
|
|
|
case "smaller":
|
|
|
|
return FONT_SMALL * _current;
|
|
|
|
case "larger":
|
|
|
|
return FONT_LARGE * _current;
|
|
|
|
}
|
2020-02-09 09:31:37 +00:00
|
|
|
|
|
|
|
try {
|
2020-04-20 07:57:42 +00:00
|
|
|
if (value.endsWith("%"))
|
|
|
|
return Integer.parseInt(value.substring(0, value.length() - 1).trim()) / 100f * _current;
|
2020-02-09 09:31:37 +00:00
|
|
|
if (value.endsWith("em"))
|
2020-04-20 07:57:42 +00:00
|
|
|
return Float.parseFloat(value.substring(0, value.length() - 2).trim()) * _current;
|
2020-02-20 10:28:55 +00:00
|
|
|
if (value.endsWith("rem"))
|
|
|
|
return Float.parseFloat(value.substring(0, value.length() - 3).trim());
|
2020-04-22 08:50:58 +00:00
|
|
|
if (value.endsWith("px") || value.endsWith("pt"))
|
2020-02-20 10:37:40 +00:00
|
|
|
return Integer.parseInt(value.substring(0, value.length() - 2).trim()) / (float) DEFAULT_FONT_SIZE;
|
2020-04-22 08:50:58 +00:00
|
|
|
if (value.endsWith("cm") || value.endsWith("in"))
|
|
|
|
return null;
|
2020-02-20 10:37:40 +00:00
|
|
|
return Integer.parseInt(value.trim()) / (float) DEFAULT_FONT_SIZE;
|
2020-04-20 07:57:42 +00:00
|
|
|
} catch (NumberFormatException ex) {
|
|
|
|
Log.w(ex);
|
2020-02-09 09:31:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
2020-01-31 12:52:57 +00:00
|
|
|
private static Integer parseColor(@NonNull String value, boolean dark) {
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Web/CSS/color_value
|
|
|
|
String c = value
|
2020-02-04 09:19:17 +00:00
|
|
|
.replace("null", "")
|
2020-01-31 12:52:57 +00:00
|
|
|
.replace("none", "")
|
|
|
|
.replace("unset", "")
|
2020-02-10 08:34:15 +00:00
|
|
|
.replace("auto", "")
|
2020-01-31 12:52:57 +00:00
|
|
|
.replace("inherit", "")
|
|
|
|
.replace("initial", "")
|
|
|
|
.replace("windowtext", "")
|
2020-02-07 08:58:22 +00:00
|
|
|
.replace("currentcolor", "")
|
2020-01-31 12:52:57 +00:00
|
|
|
.replace("transparent", "")
|
2020-02-04 09:19:17 +00:00
|
|
|
.replaceAll("[^a-z0-9(),.%#]", "")
|
|
|
|
.replaceAll("#+", "#");
|
2020-01-31 12:52:57 +00:00
|
|
|
|
|
|
|
Integer color = null;
|
|
|
|
try {
|
|
|
|
if (TextUtils.isEmpty(c))
|
|
|
|
return null;
|
2020-02-04 09:00:07 +00:00
|
|
|
else if (c.startsWith("#")) {
|
2020-02-04 09:19:17 +00:00
|
|
|
if (c.length() > 1) {
|
|
|
|
String code = c.substring(1);
|
|
|
|
if (x11ColorMap.containsKey(code)) // workaround
|
2020-02-08 17:45:28 +00:00
|
|
|
color = x11ColorMap.get(code);
|
2020-02-04 09:19:17 +00:00
|
|
|
else
|
2020-02-15 19:05:12 +00:00
|
|
|
color = Long.decode(c).intValue();
|
2020-02-04 09:19:17 +00:00
|
|
|
}
|
2020-02-04 09:00:07 +00:00
|
|
|
} else if (c.startsWith("rgb") || c.startsWith("hsl")) {
|
2020-01-31 12:52:57 +00:00
|
|
|
int s = c.indexOf("(");
|
|
|
|
int e = c.indexOf(")");
|
|
|
|
if (s > 0 && e > s) {
|
|
|
|
String[] component = c.substring(s + 1, e).split(",");
|
|
|
|
|
|
|
|
for (int i = 0; i < component.length; i++)
|
|
|
|
if (component[i].endsWith("%"))
|
|
|
|
if (c.startsWith("rgb")) {
|
|
|
|
int percent = Integer.parseInt(component[i].replace("%", ""));
|
|
|
|
component[i] = Integer.toString(Math.round(255 * (percent / 100f)));
|
|
|
|
} else
|
|
|
|
component[i] = component[i].replace("%", "");
|
|
|
|
|
|
|
|
if (c.startsWith("rgb") && component.length >= 3)
|
|
|
|
color = Color.rgb(
|
|
|
|
Integer.parseInt(component[0]),
|
|
|
|
Integer.parseInt(component[1]),
|
|
|
|
Integer.parseInt(component[2]));
|
|
|
|
else if (c.startsWith("hsl") && component.length >= 3)
|
|
|
|
color = ColorUtils.HSLToColor(new float[]{
|
|
|
|
Float.parseFloat(component[0]),
|
|
|
|
Integer.parseInt(component[1]) / 100f,
|
|
|
|
Integer.parseInt(component[2]) / 100f});
|
|
|
|
}
|
|
|
|
} else if (x11ColorMap.containsKey(c))
|
2020-02-08 17:45:28 +00:00
|
|
|
color = x11ColorMap.get(c);
|
2020-01-31 12:52:57 +00:00
|
|
|
else
|
|
|
|
try {
|
|
|
|
color = Color.parseColor(c);
|
|
|
|
} catch (IllegalArgumentException ex) {
|
2020-02-04 09:00:07 +00:00
|
|
|
// Workaround
|
2020-02-15 19:05:12 +00:00
|
|
|
color = Long.decode("#" + c).intValue();
|
2020-01-31 12:52:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (BuildConfig.DEBUG)
|
|
|
|
Log.i("Color " + c + "=" + (color == null ? null : Long.toHexString(color)));
|
|
|
|
|
|
|
|
} catch (Throwable ex) {
|
|
|
|
Log.e("Color=" + c + ": " + ex);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (color != null) {
|
|
|
|
if (dark || color != Color.BLACK)
|
|
|
|
color = Helper.adjustLuminance(color, dark, MIN_LUMINANCE);
|
2020-01-31 13:45:51 +00:00
|
|
|
|
|
|
|
color &= 0xFFFFFF;
|
2020-01-31 12:52:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return color;
|
|
|
|
}
|
|
|
|
|
2019-09-12 16:53:57 +00:00
|
|
|
private static boolean hasVisibleContent(List<Node> nodes) {
|
2019-09-12 08:45:54 +00:00
|
|
|
for (Node node : nodes)
|
|
|
|
if (node instanceof TextNode && !((TextNode) node).isBlank())
|
|
|
|
return true;
|
|
|
|
else if (node instanceof Element) {
|
|
|
|
Element element = (Element) node;
|
|
|
|
if (!element.isBlock() &&
|
2020-02-04 10:33:08 +00:00
|
|
|
(element.hasText() ||
|
|
|
|
element.selectFirst("a") != null ||
|
|
|
|
element.selectFirst("img") != null))
|
2019-09-12 08:45:54 +00:00
|
|
|
return true;
|
|
|
|
}
|
|
|
|
return false;
|
2019-09-02 17:01:17 +00:00
|
|
|
}
|
|
|
|
|
2020-04-07 17:43:02 +00:00
|
|
|
// https://tools.ietf.org/html/rfc3676
|
|
|
|
static String flow(String text) {
|
|
|
|
boolean continuation = false;
|
|
|
|
StringBuilder flowed = new StringBuilder();
|
|
|
|
for (String line : text.split("\\r?\\n")) {
|
|
|
|
if (continuation)
|
|
|
|
while (line.startsWith(">")) {
|
|
|
|
line = line.substring(1);
|
|
|
|
if (line.startsWith(" "))
|
|
|
|
line = line.substring(1);
|
|
|
|
}
|
|
|
|
|
|
|
|
continuation = (line.endsWith(" ") && !"-- ".equals(line));
|
|
|
|
|
|
|
|
flowed.append(line);
|
|
|
|
if (!continuation)
|
|
|
|
flowed.append("\r\n");
|
|
|
|
}
|
|
|
|
return flowed.toString();
|
|
|
|
}
|
|
|
|
|
2019-11-19 08:57:55 +00:00
|
|
|
static String formatPre(String text) {
|
|
|
|
int level = 0;
|
|
|
|
StringBuilder sb = new StringBuilder();
|
|
|
|
String[] lines = text.split("\\r?\\n");
|
|
|
|
for (String line : lines) {
|
|
|
|
// Opening quotes
|
|
|
|
int tlevel = 0;
|
|
|
|
while (line.startsWith(">")) {
|
|
|
|
tlevel++;
|
|
|
|
if (tlevel > level)
|
|
|
|
sb.append("<blockquote>");
|
|
|
|
|
|
|
|
line = line.substring(1); // >
|
|
|
|
|
|
|
|
if (line.startsWith(" "))
|
|
|
|
line = line.substring(1);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Closing quotes
|
|
|
|
for (int i = 0; i < level - tlevel; i++)
|
|
|
|
sb.append("</blockquote>");
|
|
|
|
level = tlevel;
|
|
|
|
|
|
|
|
// Tabs characters
|
|
|
|
StringBuilder l = new StringBuilder();
|
|
|
|
for (int j = 0; j < line.length(); j++) {
|
|
|
|
char kar = line.charAt(j);
|
|
|
|
if (kar == '\t') {
|
|
|
|
l.append(' ');
|
|
|
|
while (l.length() % TAB_SIZE != 0)
|
|
|
|
l.append(' ');
|
|
|
|
} else
|
|
|
|
l.append(kar);
|
|
|
|
}
|
|
|
|
line = l.toString();
|
|
|
|
|
|
|
|
// Html characters
|
|
|
|
line = Html.escapeHtml(line);
|
|
|
|
|
|
|
|
// Space characters
|
|
|
|
int len = line.length();
|
|
|
|
for (int j = 0; j < len; j++) {
|
|
|
|
char kar = line.charAt(j);
|
|
|
|
if (kar == ' ') {
|
|
|
|
// Prevent trimming start
|
|
|
|
// Keep one space for word wrapping
|
|
|
|
if (j == 0 || (j + 1 < len && line.charAt(j + 1) == ' '))
|
|
|
|
sb.append(" ");
|
|
|
|
else
|
|
|
|
sb.append(' ');
|
|
|
|
} else
|
|
|
|
sb.append(kar);
|
|
|
|
}
|
|
|
|
|
|
|
|
sb.append("<br>");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Closing quotes
|
|
|
|
for (int i = 0; i < level; i++)
|
|
|
|
sb.append("</blockquote>");
|
|
|
|
|
|
|
|
return sb.toString();
|
|
|
|
}
|
|
|
|
|
2019-10-04 13:25:04 +00:00
|
|
|
static void removeTrackingPixels(Context context, Document document) {
|
2019-10-04 21:04:03 +00:00
|
|
|
Drawable d = ContextCompat.getDrawable(context, R.drawable.baseline_my_location_24);
|
|
|
|
d.setTint(Helper.resolveColor(context, R.attr.colorWarning));
|
2019-10-05 07:38:36 +00:00
|
|
|
|
2019-10-04 21:04:03 +00:00
|
|
|
Bitmap bm = Bitmap.createBitmap(d.getIntrinsicWidth(), d.getIntrinsicHeight(), Bitmap.Config.ARGB_8888);
|
|
|
|
Canvas c = new Canvas(bm);
|
|
|
|
d.setBounds(0, 0, c.getWidth(), c.getHeight());
|
|
|
|
d.draw(c);
|
|
|
|
|
|
|
|
ByteArrayOutputStream bos = new ByteArrayOutputStream();
|
|
|
|
bm.compress(Bitmap.CompressFormat.PNG, 100, bos);
|
|
|
|
|
|
|
|
StringBuilder sb = new StringBuilder();
|
2019-10-05 07:38:36 +00:00
|
|
|
sb.append("data:image/png;base64,");
|
2019-10-05 09:57:54 +00:00
|
|
|
sb.append(Base64.encodeToString(bos.toByteArray(), Base64.NO_WRAP));
|
2019-10-04 21:04:03 +00:00
|
|
|
|
2019-10-04 13:25:04 +00:00
|
|
|
// Build list of allowed hosts
|
|
|
|
List<String> hosts = new ArrayList<>();
|
|
|
|
for (Element img : document.select("img")) {
|
|
|
|
String src = img.attr("src");
|
|
|
|
if (!TextUtils.isEmpty(src) && !isTrackingPixel(img)) {
|
|
|
|
Uri uri = Uri.parse(img.attr("src"));
|
|
|
|
String host = uri.getHost();
|
|
|
|
if (host != null && !hosts.contains(host))
|
|
|
|
hosts.add(host);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Images
|
|
|
|
for (Element img : document.select("img")) {
|
2019-10-05 09:57:54 +00:00
|
|
|
img.removeAttr("tracking");
|
2019-10-04 13:25:04 +00:00
|
|
|
String src = img.attr("src");
|
|
|
|
if (!TextUtils.isEmpty(src) && isTrackingPixel(img)) {
|
2019-10-14 06:50:27 +00:00
|
|
|
Uri uri = Uri.parse(src);
|
2019-10-04 13:25:04 +00:00
|
|
|
String host = uri.getHost();
|
2020-04-08 07:57:29 +00:00
|
|
|
if (host != null && !hosts.contains(host)) {
|
2019-10-04 21:04:03 +00:00
|
|
|
img.attr("src", sb.toString());
|
|
|
|
img.attr("alt", context.getString(R.string.title_legend_tracking_pixel));
|
|
|
|
img.attr("height", "24");
|
|
|
|
img.attr("width", "24");
|
2019-10-05 09:57:54 +00:00
|
|
|
img.attr("style", "display:block !important; width:24px !important; height:24px !important;");
|
2019-10-14 06:50:27 +00:00
|
|
|
img.attr("tracking", src);
|
2019-10-04 13:25:04 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-10-04 19:25:52 +00:00
|
|
|
private static boolean isTrackingPixel(Element img) {
|
|
|
|
String width = img.attr("width").trim();
|
|
|
|
String height = img.attr("height").trim();
|
2019-03-30 16:55:00 +00:00
|
|
|
|
2019-10-04 19:25:52 +00:00
|
|
|
if (TextUtils.isEmpty(width) || TextUtils.isEmpty(height))
|
|
|
|
return false;
|
2018-12-14 09:11:45 +00:00
|
|
|
|
2019-10-03 06:55:37 +00:00
|
|
|
try {
|
2019-10-04 19:25:52 +00:00
|
|
|
return (Integer.parseInt(width) * Integer.parseInt(height) <= TRACKING_PIXEL_SURFACE);
|
|
|
|
} catch (NumberFormatException ignored) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
2019-10-03 06:55:37 +00:00
|
|
|
|
2020-02-28 09:01:18 +00:00
|
|
|
static void embedInlineImages(Context context, long id, Document document, boolean local) throws IOException {
|
2019-10-04 19:25:52 +00:00
|
|
|
DB db = DB.getInstance(context);
|
|
|
|
for (Element img : document.select("img")) {
|
|
|
|
String src = img.attr("src");
|
|
|
|
if (src.startsWith("cid:")) {
|
|
|
|
String cid = '<' + src.substring(4) + '>';
|
2019-10-03 06:55:37 +00:00
|
|
|
EntityAttachment attachment = db.attachment().getAttachment(id, cid);
|
2019-10-04 19:25:52 +00:00
|
|
|
if (attachment != null && attachment.available) {
|
|
|
|
File file = attachment.getFile(context);
|
2020-02-28 09:01:18 +00:00
|
|
|
if (local) {
|
|
|
|
Uri uri = FileProvider.getUriForFile(context, BuildConfig.APPLICATION_ID, file);
|
|
|
|
img.attr("src", uri.toString());
|
|
|
|
Log.i("Inline image uri=" + uri);
|
|
|
|
} else {
|
|
|
|
try (InputStream is = new FileInputStream(file)) {
|
|
|
|
byte[] bytes = new byte[(int) file.length()];
|
|
|
|
if (is.read(bytes) != bytes.length)
|
|
|
|
throw new IOException("length");
|
|
|
|
|
|
|
|
StringBuilder sb = new StringBuilder();
|
|
|
|
sb.append("data:");
|
|
|
|
sb.append(attachment.type);
|
|
|
|
sb.append(";base64,");
|
|
|
|
sb.append(Base64.encodeToString(bytes, Base64.NO_WRAP));
|
|
|
|
|
|
|
|
img.attr("src", sb.toString());
|
|
|
|
}
|
2019-04-30 08:33:03 +00:00
|
|
|
}
|
|
|
|
}
|
2019-10-04 19:25:52 +00:00
|
|
|
}
|
2019-07-15 10:17:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-10-08 17:54:52 +00:00
|
|
|
static void setViewport(Document document) {
|
|
|
|
// https://developer.mozilla.org/en-US/docs/Mozilla/Mobile/Viewport_meta_tag
|
|
|
|
document.head().select("meta").select("[name=viewport]").remove();
|
|
|
|
|
|
|
|
document.head().prependChild(document.createElement("meta")
|
|
|
|
.attr("name", "viewport")
|
|
|
|
.attr("content", "width=device-width, initial-scale=1.0"));
|
|
|
|
|
|
|
|
Log.i(document.head().html());
|
2019-05-04 11:06:22 +00:00
|
|
|
}
|
|
|
|
|
2020-03-26 14:25:44 +00:00
|
|
|
static String getLanguage(Context context, String body) {
|
2020-02-20 09:35:01 +00:00
|
|
|
try {
|
2020-03-26 14:25:44 +00:00
|
|
|
SharedPreferences prefs = PreferenceManager.getDefaultSharedPreferences(context);
|
2020-03-26 19:28:17 +00:00
|
|
|
boolean language_detection = prefs.getBoolean("language_detection", false);
|
2020-03-26 14:34:42 +00:00
|
|
|
if (!language_detection)
|
2020-03-26 14:25:44 +00:00
|
|
|
return null;
|
|
|
|
|
|
|
|
if (Build.VERSION.SDK_INT >= Build.VERSION_CODES.Q) {
|
|
|
|
TextClassificationManager tcm =
|
|
|
|
(TextClassificationManager) context.getSystemService(Context.TEXT_CLASSIFICATION_SERVICE);
|
|
|
|
if (tcm == null)
|
|
|
|
return null;
|
|
|
|
|
|
|
|
String text = getPreview(body);
|
|
|
|
if (body == null)
|
|
|
|
return null;
|
|
|
|
|
|
|
|
TextLanguage.Request trequest = new TextLanguage.Request.Builder(text).build();
|
|
|
|
TextLanguage tlanguage = tcm.getTextClassifier().detectLanguage(trequest);
|
|
|
|
if (tlanguage.getLocaleHypothesisCount() > 0)
|
|
|
|
return tlanguage.getLocale(0).toLocale().getLanguage();
|
|
|
|
}
|
|
|
|
|
|
|
|
return null;
|
|
|
|
} catch (Throwable ex) {
|
2020-02-20 09:35:01 +00:00
|
|
|
Log.e(ex);
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-12-24 20:09:47 +00:00
|
|
|
static String getPreview(String body) {
|
2019-11-11 19:23:34 +00:00
|
|
|
try {
|
2020-02-20 09:35:01 +00:00
|
|
|
if (body == null)
|
|
|
|
return null;
|
|
|
|
Document d = JsoupEx.parse(body);
|
|
|
|
return _getText(d, false);
|
2019-11-11 19:23:34 +00:00
|
|
|
} catch (OutOfMemoryError ex) {
|
|
|
|
Log.e(ex);
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-20 09:35:01 +00:00
|
|
|
@Deprecated
|
2020-02-11 19:07:00 +00:00
|
|
|
static String getFullText(String body) {
|
|
|
|
try {
|
2020-02-20 09:35:01 +00:00
|
|
|
if (body == null)
|
|
|
|
return null;
|
|
|
|
Document d = JsoupEx.parse(body);
|
|
|
|
return _getText(d, true);
|
2020-02-11 19:07:00 +00:00
|
|
|
} catch (OutOfMemoryError ex) {
|
|
|
|
Log.e(ex);
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-02-20 09:35:01 +00:00
|
|
|
static String getFullText(File file) throws IOException {
|
|
|
|
try {
|
|
|
|
Document d = JsoupEx.parse(file);
|
|
|
|
return _getText(d, true);
|
|
|
|
} catch (OutOfMemoryError ex) {
|
|
|
|
Log.e(ex);
|
2019-10-03 16:07:56 +00:00
|
|
|
return null;
|
2020-02-20 09:35:01 +00:00
|
|
|
}
|
|
|
|
}
|
2019-10-03 16:07:56 +00:00
|
|
|
|
2020-02-20 09:35:01 +00:00
|
|
|
private static String _getText(Document d, boolean full) {
|
2020-02-14 10:06:48 +00:00
|
|
|
truncate(d, !full);
|
|
|
|
|
2020-02-28 16:58:31 +00:00
|
|
|
for (Element bq : d.select("blockquote")) {
|
|
|
|
bq.prependChild(new TextNode("["));
|
|
|
|
bq.appendChild(new TextNode("]"));
|
|
|
|
}
|
|
|
|
|
2020-02-14 10:06:48 +00:00
|
|
|
String text = d.text();
|
2020-02-11 19:07:00 +00:00
|
|
|
if (full)
|
|
|
|
return text;
|
2019-10-03 16:07:56 +00:00
|
|
|
|
|
|
|
String preview = text.substring(0, Math.min(text.length(), PREVIEW_SIZE));
|
|
|
|
if (preview.length() < text.length())
|
|
|
|
preview += "…";
|
|
|
|
|
|
|
|
return preview;
|
2019-01-05 11:17:33 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static String getText(String html) {
|
|
|
|
final StringBuilder sb = new StringBuilder();
|
|
|
|
|
2019-08-22 18:05:45 +00:00
|
|
|
html = html.replace("<br> ", "<br>");
|
|
|
|
|
2020-02-14 10:06:48 +00:00
|
|
|
Document d = JsoupEx.parse(html);
|
|
|
|
|
|
|
|
truncate(d, true);
|
|
|
|
|
2019-01-05 11:17:33 +00:00
|
|
|
NodeTraversor.traverse(new NodeVisitor() {
|
2019-02-10 12:01:21 +00:00
|
|
|
private int qlevel = 0;
|
2019-02-11 15:36:42 +00:00
|
|
|
private int tlevel = 0;
|
2019-09-07 06:22:46 +00:00
|
|
|
private int plevel = 0;
|
2019-11-22 19:42:45 +00:00
|
|
|
private int lindex = 0;
|
2019-02-10 12:01:21 +00:00
|
|
|
|
2020-03-10 07:29:18 +00:00
|
|
|
private final List<String> tails = Collections.unmodifiableList(Arrays.asList(
|
2020-03-11 17:08:19 +00:00
|
|
|
"h1", "h2", "h3", "h4", "h5", "h6", "p", "ol", "ul", "li", "div", "table", "br", "hr"));
|
2020-03-10 07:29:18 +00:00
|
|
|
|
2019-01-05 11:17:33 +00:00
|
|
|
public void head(Node node, int depth) {
|
2019-08-23 06:29:58 +00:00
|
|
|
if (node instanceof TextNode)
|
2019-09-07 06:22:46 +00:00
|
|
|
if (plevel > 0) {
|
|
|
|
String[] lines = ((TextNode) node).getWholeText().split("\\r?\\n");
|
|
|
|
for (String line : lines) {
|
2019-11-22 19:42:45 +00:00
|
|
|
append(line, true);
|
2019-09-07 06:22:46 +00:00
|
|
|
newline();
|
|
|
|
}
|
|
|
|
} else
|
|
|
|
append(((TextNode) node).text());
|
2019-08-23 06:29:58 +00:00
|
|
|
else {
|
2019-01-05 11:17:33 +00:00
|
|
|
String name = node.nodeName();
|
2020-03-08 15:05:43 +00:00
|
|
|
if ("li".equals(name) && node.parent() != null)
|
|
|
|
append("ol".equals(node.parent().nodeName()) ? "-" : "*");
|
2019-02-10 12:01:21 +00:00
|
|
|
else if ("blockquote".equals(name))
|
|
|
|
qlevel++;
|
2019-09-07 06:22:46 +00:00
|
|
|
else if ("pre".equals(name))
|
|
|
|
plevel++;
|
2019-01-05 11:17:33 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public void tail(Node node, int depth) {
|
|
|
|
String name = node.nodeName();
|
2020-03-11 16:26:04 +00:00
|
|
|
if ("a".equals(name)) {
|
|
|
|
String addr = node.attr("href").toLowerCase();
|
|
|
|
if (addr.startsWith("mailto:"))
|
|
|
|
addr = addr.substring("mailto:".length());
|
|
|
|
String text = ((Element) node).text().toLowerCase();
|
|
|
|
if (!text.contains(addr))
|
|
|
|
append("[" + node.attr("href") + "]");
|
|
|
|
} else if ("img".equals(name))
|
2019-11-07 12:30:13 +00:00
|
|
|
append("[" + node.attr("src") + "]");
|
2019-08-23 06:29:58 +00:00
|
|
|
else if ("th".equals(name) || "td".equals(name)) {
|
2019-02-10 12:01:21 +00:00
|
|
|
Node next = node.nextSibling();
|
|
|
|
if (next == null || !("th".equals(next.nodeName()) || "td".equals(next.nodeName())))
|
|
|
|
newline();
|
2019-11-07 12:30:13 +00:00
|
|
|
else
|
|
|
|
append(" ");
|
2019-02-10 12:01:21 +00:00
|
|
|
} else if ("blockquote".equals(name))
|
|
|
|
qlevel--;
|
2019-09-07 06:22:46 +00:00
|
|
|
else if ("pre".equals(name))
|
|
|
|
plevel--;
|
2019-02-10 12:01:21 +00:00
|
|
|
|
2020-03-11 17:08:19 +00:00
|
|
|
if (tails.contains(name) &&
|
|
|
|
!("br".equals(name) &&
|
|
|
|
node.nextSibling() == null &&
|
|
|
|
node.parent() != null && "div".equals(node.parent().nodeName())))
|
2019-02-10 12:01:21 +00:00
|
|
|
newline();
|
|
|
|
}
|
|
|
|
|
2019-02-11 15:36:42 +00:00
|
|
|
private void append(String text) {
|
2019-11-22 19:42:45 +00:00
|
|
|
append(text, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
private void append(String text, boolean raw) {
|
2019-02-11 15:36:42 +00:00
|
|
|
if (tlevel != qlevel) {
|
|
|
|
newline();
|
|
|
|
tlevel = qlevel;
|
|
|
|
}
|
2019-11-22 19:42:45 +00:00
|
|
|
|
|
|
|
if (!raw && !"-- ".equals(text)) {
|
|
|
|
text = text.trim();
|
|
|
|
if (lindex > 0)
|
|
|
|
text = " " + text;
|
|
|
|
}
|
|
|
|
|
2019-02-11 15:36:42 +00:00
|
|
|
sb.append(text);
|
2019-11-22 19:42:45 +00:00
|
|
|
lindex += text.length();
|
2019-02-11 15:36:42 +00:00
|
|
|
}
|
|
|
|
|
2019-02-10 12:01:21 +00:00
|
|
|
private void newline() {
|
2019-11-22 19:42:45 +00:00
|
|
|
lindex = 0;
|
2019-02-10 12:01:21 +00:00
|
|
|
sb.append("\n");
|
2019-11-22 19:42:45 +00:00
|
|
|
|
2019-02-10 12:01:21 +00:00
|
|
|
for (int i = 0; i < qlevel; i++)
|
2019-11-22 19:42:45 +00:00
|
|
|
sb.append("> ");
|
2019-01-05 11:17:33 +00:00
|
|
|
}
|
2020-02-14 10:06:48 +00:00
|
|
|
}, d);
|
2019-01-05 11:17:33 +00:00
|
|
|
|
2019-02-10 12:01:21 +00:00
|
|
|
sb.append("\n");
|
|
|
|
|
2019-01-05 11:17:33 +00:00
|
|
|
return sb.toString();
|
2018-12-24 20:09:47 +00:00
|
|
|
}
|
2020-03-08 15:05:43 +00:00
|
|
|
|
|
|
|
static void convertLists(Document document) {
|
2020-04-21 12:52:34 +00:00
|
|
|
for (Element span : document.select("span")) {
|
2020-03-15 12:49:17 +00:00
|
|
|
// Skip signature and referenced message
|
|
|
|
boolean body = true;
|
2020-04-21 12:52:34 +00:00
|
|
|
Element parent = span.parent();
|
2020-03-15 12:49:17 +00:00
|
|
|
while (parent != null) {
|
|
|
|
if ("div".equals(parent.tagName()) &&
|
|
|
|
!TextUtils.isEmpty(parent.attr("fairemail"))) {
|
|
|
|
body = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
parent = parent.parent();
|
|
|
|
}
|
|
|
|
if (!body)
|
|
|
|
continue;
|
|
|
|
|
2020-03-08 15:05:43 +00:00
|
|
|
Element list = null;
|
2020-04-21 12:52:34 +00:00
|
|
|
for (int i = 0; i < span.childNodeSize(); i++) {
|
2020-03-08 15:05:43 +00:00
|
|
|
boolean item = false;
|
2020-04-21 12:52:34 +00:00
|
|
|
Node node = span.childNode(i);
|
2020-03-08 15:05:43 +00:00
|
|
|
if (node instanceof TextNode) {
|
|
|
|
String text = ((TextNode) node).text().trim();
|
|
|
|
Node next = node.nextSibling();
|
|
|
|
if ((text.startsWith("* ") || text.startsWith("- ")) &&
|
|
|
|
(next == null || "br".equals(next.nodeName()))) {
|
|
|
|
item = true;
|
|
|
|
String type = (text.startsWith("* ") ? "ul" : "ol");
|
|
|
|
|
|
|
|
Element li = document.createElement("li");
|
|
|
|
li.text(text.substring(2));
|
|
|
|
|
|
|
|
if (list == null || !list.tagName().equals(type)) {
|
2020-04-21 12:52:34 +00:00
|
|
|
Node before = node.previousSibling();
|
|
|
|
if (before != null && "br".equals(before.nodeName())) {
|
|
|
|
before.remove();
|
|
|
|
i--;
|
|
|
|
}
|
|
|
|
|
2020-03-08 15:05:43 +00:00
|
|
|
list = document.createElement(type);
|
|
|
|
list.appendChild(li);
|
|
|
|
node.replaceWith(list);
|
2020-04-21 12:52:34 +00:00
|
|
|
|
2020-03-08 15:05:43 +00:00
|
|
|
} else {
|
|
|
|
list.appendChild(li);
|
|
|
|
node.remove();
|
|
|
|
i--;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (next != null)
|
|
|
|
next.remove();
|
|
|
|
}
|
2020-04-21 12:52:34 +00:00
|
|
|
} else {
|
|
|
|
if (list != null && "br".equals(node.nodeName())) {
|
|
|
|
node.remove();
|
|
|
|
i--;
|
|
|
|
}
|
2020-03-08 15:05:43 +00:00
|
|
|
}
|
|
|
|
if (!item)
|
|
|
|
list = null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2019-02-10 12:01:21 +00:00
|
|
|
|
2019-08-29 19:57:04 +00:00
|
|
|
static Spanned highlightHeaders(Context context, String headers) {
|
|
|
|
int colorAccent = Helper.resolveColor(context, R.attr.colorAccent);
|
|
|
|
SpannableStringBuilder ssb = new SpannableStringBuilder(headers);
|
|
|
|
int index = 0;
|
|
|
|
for (String line : headers.split("\n")) {
|
|
|
|
if (line.length() > 0 && !Character.isWhitespace(line.charAt(0))) {
|
|
|
|
int colon = line.indexOf(':');
|
|
|
|
if (colon > 0)
|
|
|
|
ssb.setSpan(new ForegroundColorSpan(colorAccent), index, index + colon, 0);
|
|
|
|
}
|
|
|
|
index += line.length() + 1;
|
|
|
|
}
|
|
|
|
return ssb;
|
|
|
|
}
|
|
|
|
|
2020-02-14 12:31:34 +00:00
|
|
|
static void cleanup(Document d) {
|
2020-02-14 15:57:09 +00:00
|
|
|
// https://www.chromestatus.com/feature/5756335865987072
|
|
|
|
// Some messages contain 100 thousands of Apple spaces
|
2020-02-14 14:40:47 +00:00
|
|
|
for (Element aspace : d.select(".Apple-converted-space")) {
|
|
|
|
Node next = aspace.nextSibling();
|
|
|
|
if (next instanceof TextNode) {
|
|
|
|
TextNode tnode = (TextNode) next;
|
2020-02-14 15:57:09 +00:00
|
|
|
tnode.text(" " + tnode.text());
|
2020-02-14 12:31:34 +00:00
|
|
|
aspace.remove();
|
|
|
|
} else
|
|
|
|
aspace.replaceWith(new TextNode(" "));
|
2020-02-14 14:40:47 +00:00
|
|
|
}
|
2020-02-14 12:31:34 +00:00
|
|
|
}
|
|
|
|
|
2020-02-14 10:06:48 +00:00
|
|
|
static boolean truncate(Document d, boolean reformat) {
|
2020-02-16 09:08:46 +00:00
|
|
|
int max = (reformat ? MAX_FORMAT_TEXT_SIZE : MAX_FULL_TEXT_SIZE);
|
2020-02-14 10:06:48 +00:00
|
|
|
|
|
|
|
int length = 0;
|
2020-02-20 12:11:13 +00:00
|
|
|
int images = 0;
|
2020-02-14 10:06:48 +00:00
|
|
|
for (Element elm : d.select("*")) {
|
2020-02-20 12:11:13 +00:00
|
|
|
if ("img".equals(elm.tagName()))
|
|
|
|
images++;
|
2020-02-16 09:08:46 +00:00
|
|
|
|
2020-02-20 12:11:13 +00:00
|
|
|
boolean skip = false;
|
2020-02-16 09:08:46 +00:00
|
|
|
for (Node child : elm.childNodes()) {
|
|
|
|
if (child instanceof TextNode) {
|
|
|
|
TextNode tnode = ((TextNode) child);
|
|
|
|
String text = tnode.getWholeText();
|
|
|
|
|
|
|
|
if (length < max) {
|
|
|
|
if (length + text.length() >= max) {
|
|
|
|
text = text.substring(0, max - length) + " ...";
|
|
|
|
tnode.text(text);
|
|
|
|
skip = true;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if (skip)
|
2020-02-16 09:56:27 +00:00
|
|
|
tnode.text("");
|
2020-02-16 09:08:46 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
length += text.length();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (length >= max && !skip)
|
2020-02-14 10:06:48 +00:00
|
|
|
elm.remove();
|
|
|
|
}
|
2020-02-16 09:08:46 +00:00
|
|
|
|
2020-02-20 12:11:13 +00:00
|
|
|
Log.i("Message size=" + length + " images=" + images);
|
|
|
|
|
2020-02-16 09:08:46 +00:00
|
|
|
return (length >= max);
|
2020-02-14 10:06:48 +00:00
|
|
|
}
|
|
|
|
|
2020-02-20 09:07:01 +00:00
|
|
|
static boolean contains(Document d, String[] texts) {
|
|
|
|
Map<String, Boolean> condition = new HashMap<>();
|
|
|
|
for (String t : texts)
|
|
|
|
condition.put(t, false);
|
|
|
|
|
|
|
|
for (Element elm : d.select("*"))
|
|
|
|
for (Node child : elm.childNodes()) {
|
|
|
|
if (child instanceof TextNode) {
|
|
|
|
TextNode tnode = ((TextNode) child);
|
|
|
|
String text = tnode.getWholeText();
|
|
|
|
for (String t : texts)
|
|
|
|
if (!condition.get(t) && text.contains(t)) {
|
|
|
|
condition.put(t, true);
|
|
|
|
|
|
|
|
boolean found = true;
|
|
|
|
for (String c : texts)
|
|
|
|
if (!condition.get(c)) {
|
|
|
|
found = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (found)
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2019-02-10 12:01:21 +00:00
|
|
|
static Spanned fromHtml(@NonNull String html) {
|
|
|
|
return fromHtml(html, null, null);
|
|
|
|
}
|
|
|
|
|
|
|
|
static Spanned fromHtml(@NonNull String html, @Nullable Html.ImageGetter imageGetter, @Nullable Html.TagHandler tagHandler) {
|
2019-03-26 13:37:04 +00:00
|
|
|
Spanned spanned = HtmlCompat.fromHtml(html, FROM_HTML_SEPARATOR_LINE_BREAK_LIST_ITEM, imageGetter, tagHandler);
|
|
|
|
|
|
|
|
int i = spanned.length();
|
|
|
|
while (i > 1 && spanned.charAt(i - 2) == '\n' && spanned.charAt(i - 1) == '\n')
|
|
|
|
i--;
|
|
|
|
if (i != spanned.length())
|
|
|
|
spanned = (Spanned) spanned.subSequence(0, i);
|
|
|
|
|
|
|
|
return spanned;
|
2019-02-10 12:01:21 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static String toHtml(Spanned spanned) {
|
2019-05-01 13:58:41 +00:00
|
|
|
String html = HtmlCompat.toHtml(spanned, TO_HTML_PARAGRAPH_LINES_CONSECUTIVE);
|
|
|
|
|
|
|
|
// @Google: why convert size to and from in a different way?
|
2019-10-03 16:19:22 +00:00
|
|
|
Document doc = JsoupEx.parse(html);
|
2019-05-01 13:58:41 +00:00
|
|
|
for (Element element : doc.select("span")) {
|
|
|
|
String style = element.attr("style");
|
|
|
|
if (style.startsWith("font-size:")) {
|
|
|
|
int colon = style.indexOf(':');
|
|
|
|
int semi = style.indexOf("em;", colon);
|
|
|
|
if (semi > colon)
|
|
|
|
try {
|
|
|
|
String hsize = style.substring(colon + 1, semi).replace(',', '.');
|
|
|
|
float size = Float.parseFloat(hsize);
|
|
|
|
element.tagName(size < 1.0f ? "small" : "big");
|
|
|
|
element.attributes().remove("style");
|
|
|
|
} catch (NumberFormatException ex) {
|
|
|
|
Log.e(ex);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-09-23 17:18:21 +00:00
|
|
|
return doc.html();
|
2019-02-10 12:01:21 +00:00
|
|
|
}
|
2018-08-02 13:33:06 +00:00
|
|
|
}
|