package eu.faircode.email;
/*
This file is part of FairEmail.
FairEmail is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
FairEmail is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with FairEmail. If not, see <http://www.gnu.org/licenses/>.
Copyright 2018-2020 by Marcel Bokhorst (M66B)
*/
import android.content.Context;
import android.content.SharedPreferences;
import android.graphics.Bitmap;
import android.graphics.Canvas;
import android.graphics.Color;
import android.graphics.drawable.Drawable;
import android.net.Uri;
import android.os.Build;
import android.text.Html;
import android.text.SpannableStringBuilder;
import android.text.Spanned;
import android.text.TextUtils;
import android.text.style.ForegroundColorSpan;
import android.util.Base64;
import androidx.annotation.NonNull;
import androidx.annotation.Nullable;
import androidx.core.content.ContextCompat;
import androidx.core.text.HtmlCompat;
import androidx.core.util.PatternsCompat;
import androidx.preference.PreferenceManager;
import org.jsoup.nodes.Attribute;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.nodes.Node;
import org.jsoup.nodes.TextNode;
import org.jsoup.safety.Cleaner;
import org.jsoup.safety.Whitelist;
import org.jsoup.select.NodeTraversor;
import org.jsoup.select.NodeVisitor;
import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Locale;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import static androidx.core.text.HtmlCompat.FROM_HTML_SEPARATOR_LINE_BREAK_LIST_ITEM;
import static androidx.core.text.HtmlCompat.TO_HTML_PARAGRAPH_LINES_CONSECUTIVE;
public class HtmlHelper {
// Maximum number of characters of body text returned by getPreview before an ellipsis is added
private static final int PREVIEW_SIZE = 500; // characters
// Minimum luminance handed to Helper.adjustLuminance when sanitizing text colors
private static final float MIN_LUMINANCE = 0.5f;
// Tab stops used by formatPre when expanding tab characters into spaces
private static final int TAB_SIZE = 2;
// Upper bound on the number of links created by the autolink pass of _sanitize
private static final int MAX_AUTO_LINK = 250;
// Images with width * height at or below this value are treated as tracking pixels
private static final int TRACKING_PIXEL_SURFACE = 25; // pixels

// Tags that start a new line in getText when the node is entered
private static final List<String> heads = Collections.unmodifiableList(Arrays.asList(
        "h1", "h2", "h3", "h4", "h5", "h6", "p", "ol", "ul", "table", "br", "hr"));

// Tags that start a new line in getText when the node is left
private static final List<String> tails = Collections.unmodifiableList(Arrays.asList(
        "h1", "h2", "h3", "h4", "h5", "h6", "p", "ol", "ul", "li"));
private static final HashMap x11ColorMap = new HashMap<>();
static {
// https://www.w3.org/TR/css-color-3/
x11ColorMap.put("aliceblue", 0xF0F8FF);
x11ColorMap.put("antiquewhite", 0xFAEBD7);
x11ColorMap.put("aqua", 0x00FFFF);
x11ColorMap.put("aquamarine", 0x7FFFD4);
x11ColorMap.put("azure", 0xF0FFFF);
x11ColorMap.put("beige", 0xF5F5DC);
x11ColorMap.put("bisque", 0xFFE4C4);
x11ColorMap.put("black", 0x000000);
x11ColorMap.put("blanchedalmond", 0xFFEBCD);
x11ColorMap.put("blue", 0x0000FF);
x11ColorMap.put("blueviolet", 0x8A2BE2);
x11ColorMap.put("brown", 0xA52A2A);
x11ColorMap.put("burlywood", 0xDEB887);
x11ColorMap.put("cadetblue", 0x5F9EA0);
x11ColorMap.put("chartreuse", 0x7FFF00);
x11ColorMap.put("chocolate", 0xD2691E);
x11ColorMap.put("coral", 0xFF7F50);
x11ColorMap.put("cornflowerblue", 0x6495ED);
x11ColorMap.put("cornsilk", 0xFFF8DC);
x11ColorMap.put("crimson", 0xDC143C);
x11ColorMap.put("cyan", 0x00FFFF);
x11ColorMap.put("darkblue", 0x00008B);
x11ColorMap.put("darkcyan", 0x008B8B);
x11ColorMap.put("darkgoldenrod", 0xB8860B);
x11ColorMap.put("darkgray", 0xA9A9A9);
x11ColorMap.put("darkgreen", 0x006400);
x11ColorMap.put("darkgrey", 0xA9A9A9);
x11ColorMap.put("darkkhaki", 0xBDB76B);
x11ColorMap.put("darkmagenta", 0x8B008B);
x11ColorMap.put("darkolivegreen", 0x556B2F);
x11ColorMap.put("darkorange", 0xFF8C00);
x11ColorMap.put("darkorchid", 0x9932CC);
x11ColorMap.put("darkred", 0x8B0000);
x11ColorMap.put("darksalmon", 0xE9967A);
x11ColorMap.put("darkseagreen", 0x8FBC8F);
x11ColorMap.put("darkslateblue", 0x483D8B);
x11ColorMap.put("darkslategray", 0x2F4F4F);
x11ColorMap.put("darkslategrey", 0x2F4F4F);
x11ColorMap.put("darkturquoise", 0x00CED1);
x11ColorMap.put("darkviolet", 0x9400D3);
x11ColorMap.put("deeppink", 0xFF1493);
x11ColorMap.put("deepskyblue", 0x00BFFF);
x11ColorMap.put("dimgray", 0x696969);
x11ColorMap.put("dimgrey", 0x696969);
x11ColorMap.put("dodgerblue", 0x1E90FF);
x11ColorMap.put("firebrick", 0xB22222);
x11ColorMap.put("floralwhite", 0xFFFAF0);
x11ColorMap.put("forestgreen", 0x228B22);
x11ColorMap.put("fuchsia", 0xFF00FF);
x11ColorMap.put("gainsboro", 0xDCDCDC);
x11ColorMap.put("ghostwhite", 0xF8F8FF);
x11ColorMap.put("gold", 0xFFD700);
x11ColorMap.put("goldenrod", 0xDAA520);
x11ColorMap.put("gray", 0x808080);
x11ColorMap.put("green", 0x008000);
x11ColorMap.put("greenyellow", 0xADFF2F);
x11ColorMap.put("grey", 0x808080);
x11ColorMap.put("honeydew", 0xF0FFF0);
x11ColorMap.put("hotpink", 0xFF69B4);
x11ColorMap.put("indianred", 0xCD5C5C);
x11ColorMap.put("indigo", 0x4B0082);
x11ColorMap.put("ivory", 0xFFFFF0);
x11ColorMap.put("khaki", 0xF0E68C);
x11ColorMap.put("lavender", 0xE6E6FA);
x11ColorMap.put("lavenderblush", 0xFFF0F5);
x11ColorMap.put("lawngreen", 0x7CFC00);
x11ColorMap.put("lemonchiffon", 0xFFFACD);
x11ColorMap.put("lightblue", 0xADD8E6);
x11ColorMap.put("lightcoral", 0xF08080);
x11ColorMap.put("lightcyan", 0xE0FFFF);
x11ColorMap.put("lightgoldenrodyellow", 0xFAFAD2);
x11ColorMap.put("lightgray", 0xD3D3D3);
x11ColorMap.put("lightgreen", 0x90EE90);
x11ColorMap.put("lightgrey", 0xD3D3D3);
x11ColorMap.put("lightpink", 0xFFB6C1);
x11ColorMap.put("lightsalmon", 0xFFA07A);
x11ColorMap.put("lightseagreen", 0x20B2AA);
x11ColorMap.put("lightskyblue", 0x87CEFA);
x11ColorMap.put("lightslategray", 0x778899);
x11ColorMap.put("lightslategrey", 0x778899);
x11ColorMap.put("lightsteelblue", 0xB0C4DE);
x11ColorMap.put("lightyellow", 0xFFFFE0);
x11ColorMap.put("lime", 0x00FF00);
x11ColorMap.put("limegreen", 0x32CD32);
x11ColorMap.put("linen", 0xFAF0E6);
x11ColorMap.put("magenta", 0xFF00FF);
x11ColorMap.put("maroon", 0x800000);
x11ColorMap.put("mediumaquamarine", 0x66CDAA);
x11ColorMap.put("mediumblue", 0x0000CD);
x11ColorMap.put("mediumorchid", 0xBA55D3);
x11ColorMap.put("mediumpurple", 0x9370DB);
x11ColorMap.put("mediumseagreen", 0x3CB371);
x11ColorMap.put("mediumslateblue", 0x7B68EE);
x11ColorMap.put("mediumspringgreen", 0x00FA9A);
x11ColorMap.put("mediumturquoise", 0x48D1CC);
x11ColorMap.put("mediumvioletred", 0xC71585);
x11ColorMap.put("midnightblue", 0x191970);
x11ColorMap.put("mintcream", 0xF5FFFA);
x11ColorMap.put("mistyrose", 0xFFE4E1);
x11ColorMap.put("moccasin", 0xFFE4B5);
x11ColorMap.put("navajowhite", 0xFFDEAD);
x11ColorMap.put("navy", 0x000080);
x11ColorMap.put("oldlace", 0xFDF5E6);
x11ColorMap.put("olive", 0x808000);
x11ColorMap.put("olivedrab", 0x6B8E23);
x11ColorMap.put("orange", 0xFFA500);
x11ColorMap.put("orangered", 0xFF4500);
x11ColorMap.put("orchid", 0xDA70D6);
x11ColorMap.put("palegoldenrod", 0xEEE8AA);
x11ColorMap.put("palegreen", 0x98FB98);
x11ColorMap.put("paleturquoise", 0xAFEEEE);
x11ColorMap.put("palevioletred", 0xDB7093);
x11ColorMap.put("papayawhip", 0xFFEFD5);
x11ColorMap.put("peachpuff", 0xFFDAB9);
x11ColorMap.put("peru", 0xCD853F);
x11ColorMap.put("pink", 0xFFC0CB);
x11ColorMap.put("plum", 0xDDA0DD);
x11ColorMap.put("powderblue", 0xB0E0E6);
x11ColorMap.put("purple", 0x800080);
x11ColorMap.put("red", 0xFF0000);
x11ColorMap.put("rosybrown", 0xBC8F8F);
x11ColorMap.put("royalblue", 0x4169E1);
x11ColorMap.put("saddlebrown", 0x8B4513);
x11ColorMap.put("salmon", 0xFA8072);
x11ColorMap.put("sandybrown", 0xF4A460);
x11ColorMap.put("seagreen", 0x2E8B57);
x11ColorMap.put("seashell", 0xFFF5EE);
x11ColorMap.put("sienna", 0xA0522D);
x11ColorMap.put("silver", 0xC0C0C0);
x11ColorMap.put("skyblue", 0x87CEEB);
x11ColorMap.put("slateblue", 0x6A5ACD);
x11ColorMap.put("slategray", 0x708090);
x11ColorMap.put("slategrey", 0x708090);
x11ColorMap.put("snow", 0xFFFAFA);
x11ColorMap.put("springgreen", 0x00FF7F);
x11ColorMap.put("steelblue", 0x4682B4);
x11ColorMap.put("tan", 0xD2B48C);
x11ColorMap.put("teal", 0x008080);
x11ColorMap.put("thistle", 0xD8BFD8);
x11ColorMap.put("tomato", 0xFF6347);
x11ColorMap.put("turquoise", 0x40E0D0);
x11ColorMap.put("violet", 0xEE82EE);
x11ColorMap.put("wheat", 0xF5DEB3);
x11ColorMap.put("white", 0xFFFFFF);
x11ColorMap.put("whitesmoke", 0xF5F5F5);
x11ColorMap.put("yellow", 0xFFFF00);
x11ColorMap.put("yellowgreen", 0x9ACD32);
}
/**
 * Sanitizes {@code html} via {@link #_sanitize} and never throws: when sanitizing
 * fails for any reason the failure is logged and a shell document is returned whose
 * body holds the formatted throwable inside a {@code strong} element.
 *
 * @param context     context used to read preferences and resources
 * @param html        the HTML to sanitize
 * @param show_images whether images are going to be shown
 * @param autolink    whether plain text addresses should be turned into links
 * @return the sanitized document, or a document describing the failure
 */
static Document sanitize(Context context, String html, boolean show_images, boolean autolink) {
    Document result;
    try {
        result = _sanitize(context, html, show_images, autolink);
    } catch (Throwable ex) {
        // OutOfMemoryError
        Log.e(ex);

        // Show the problem in place of the message
        result = Document.createShell("");
        Element message = result.createElement("strong");
        message.text(Log.formatThrowable(ex));
        result.body().appendChild(message);
    }
    return result;
}
/**
 * Parses {@code html}, cleans it with a jsoup whitelist and rewrites the remaining
 * markup into a small set of tags (mostly {@code span}, {@code br}, {@code strong},
 * {@code em}, {@code a} and {@code img}).
 * <p>
 * The passes run in a fixed order: namespace prefixes, whitelist cleaning, font and
 * style sanitizing, block level rewriting (paragraphs, quotes, pre, lists, tables),
 * tracking pixel replacement, image annotation, optional auto linking and finally
 * selective line breaks. Later passes rely on the tag names produced by earlier ones.
 * <p>
 * The preferences "text_color", "display_hidden" and "disable_tracking" are read
 * from the default shared preferences.
 *
 * @param context     context used to read preferences and resources
 * @param html        the HTML to sanitize
 * @param show_images when false, the alt text of images is appended to the image element
 * @param autolink    whether e-mail addresses and web URLs in text nodes are linked
 * @return the sanitized document
 */
private static Document _sanitize(Context context, String html, boolean show_images, boolean autolink) {
    SharedPreferences prefs = PreferenceManager.getDefaultSharedPreferences(context);
    boolean text_color = prefs.getBoolean("text_color", true);
    boolean display_hidden = prefs.getBoolean("display_hidden", false);
    boolean disable_tracking = prefs.getBoolean("disable_tracking", true);

    Document parsed = JsoupEx.parse(html);

    // Default XHTML namespace: http://www.w3.org/1999/xhtml
    // Find a prefix that the html element binds to a W3C namespace
    String ns = null;
    for (Element h : parsed.select("html"))
        for (Attribute a : h.attributes()) {
            String key = a.getKey();
            String value = a.getValue();
            if (value != null &&
                    key.startsWith("xmlns:") &&
                    value.startsWith("http://www.w3.org/")) {
                // A bare "xmlns:" has no prefix part, skip it instead of failing
                String[] parts = key.split(":");
                if (parts.length > 1) {
                    ns = parts[1];
                    break;
                }
            }
        }

    // Strip the known prefix from prefixed tags, drop all other prefixed tags
    for (Element e : parsed.select("*")) {
        String tag = e.tagName();
        if (tag.contains(":")) {
            String[] parts = tag.split(":");
            // Tags like "o:" have no local name and cannot be renamed
            if (ns != null && tag.startsWith(ns) &&
                    parts.length > 1 && !parts[1].isEmpty()) {
                e.tagName(parts[1]);
                Log.i("Updated tag=" + tag + " to=" + e.tagName());
            } else {
                e.remove();
                Log.i("Removed tag=" + tag);
            }
        }
    }

    Whitelist whitelist = Whitelist.relaxed()
            .addTags("hr", "abbr", "big", "font")
            .removeTags("col", "colgroup", "thead", "tbody")
            .removeAttributes("table", "width")
            .removeAttributes("td", "colspan", "rowspan", "width")
            .removeAttributes("th", "colspan", "rowspan", "width")
            .addProtocols("img", "src", "cid")
            .addProtocols("img", "src", "data");
    if (text_color)
        whitelist
                .addAttributes(":all", "style")
                .addAttributes("font", "color");

    final Document document = new Cleaner(whitelist).clean(parsed);

    boolean dark = Helper.isDarkTheme(context);

    // Font
    // Move the font color into a style so it is handled by the style pass below
    for (Element font : document.select("font")) {
        String color = font.attr("color");
        if (Build.VERSION.SDK_INT >= Build.VERSION_CODES.N)
            font.removeAttr("color");
        font.removeAttr("face");
        font.attr("style", "color:" + color + ";");
        font.tagName("span");
    }

    // Sanitize styles
    for (Element element : document.select("*")) {
        String style = element.attr("style");
        if (!TextUtils.isEmpty(style)) {
            StringBuilder sb = new StringBuilder();

            String[] params = style.split(";");
            for (String param : params) {
                String[] kv = param.split(":");
                if (kv.length == 2) {
                    String key = kv[0].trim().toLowerCase(Locale.ROOT);
                    String value = kv[1].toLowerCase(Locale.ROOT)
                            .replaceAll("\\s", "");
                    switch (key) {
                        case "color":
                            // Keep the punctuation of "#rrggbb" and "rgb(r,g,b)",
                            // else the branches below can never match.
                            // '.' and '%' are kept so unsupported forms fail to parse
                            // instead of being read as different numbers.
                            String c = value
                                    .replace("none", "")
                                    .replace("unset", "")
                                    .replace("inherit", "")
                                    .replace("initial", "")
                                    .replace("windowtext", "")
                                    .replace("transparent", "")
                                    .replace("!important", "")
                                    .replaceAll("[^a-z0-9#(),.%]", "");

                            Integer color = null;
                            try {
                                if (TextUtils.isEmpty(c))
                                    ; // Do nothing
                                else if (c.startsWith("#"))
                                    color = Integer.decode(c) | 0xFF000000;
                                else if (c.startsWith("rgb")) {
                                    int s = c.indexOf("(");
                                    int e = c.indexOf(")");
                                    if (s > 0 && e > s) {
                                        String[] rgb = c.substring(s + 1, e).split(",");
                                        if (rgb.length == 3)
                                            color = Color.rgb(
                                                    Integer.parseInt(rgb[0]),
                                                    Integer.parseInt(rgb[1]),
                                                    Integer.parseInt(rgb[2])
                                            );
                                    }
                                } else if (x11ColorMap.containsKey(c))
                                    color = x11ColorMap.get(c);
                                else
                                    try {
                                        color = Color.parseColor(c);
                                    } catch (IllegalArgumentException ex) {
                                        // Maybe a hex value without leading hash
                                        color = Integer.decode("#" + c) | 0xFF000000;
                                    }
                            } catch (Throwable ex) {
                                Log.e("Color=" + c + ": " + ex);
                            }

                            // Black on a dark theme is dropped so the default text color applies
                            if (color != null && !(dark && color == Color.BLACK)) {
                                color = Helper.adjustLuminance(color, dark, MIN_LUMINANCE);
                                c = String.format("#%06x", color & 0xFFFFFF);
                                sb.append("color:").append(c).append(";");
                                if (Build.VERSION.SDK_INT < Build.VERSION_CODES.N)
                                    element.attr("color", c);
                            }
                            break;

                        case "background":
                        case "background-color":
                            break;

                        case "line-through":
                            sb.append(param).append(";");
                            break;

                        case "display":
                            if (!display_hidden && "none".equals(value)) {
                                Log.i("Removing element " + element.tagName());
                                element.empty();
                            }

                            // Remembered for the selective new lines pass at the end
                            if ("inline".equals(value) || "inline-block".equals(value))
                                element.attr("inline", "true");
                            break;

                        case "height":
                        case "width":
                            //case "font-size":
                            //case "line-height":
                            if (!display_hidden &&
                                    ("0".equals(value) || "0px".equals(value))) {
                                Log.i("Removing element " + element.tagName());
                                element.empty();
                            }
                            break;
                    }
                }
            }

            if (sb.length() == 0)
                element.removeAttr("style");
            else
                element.attr("style", sb.toString());
        }
    }

    // Remove new lines without surrounding content
    //for (Element br : document.select("br"))
    //    if (br.parent() != null && !hasVisibleContent(br.parent().childNodes()))
    //        br.tagName("span");

    // Drop a trailing line break of innermost divs with visible content
    for (Element div : document.select("div"))
        if (div.children().select("div").size() == 0 &&
                hasVisibleContent(div.childNodes())) {
            Node last = div.childNode(div.childNodeSize() - 1);
            if (last != null && "br".equals(last.nodeName()))
                last.remove();
        }

    // Paragraphs
    for (Element p : document.select("p")) {
        p.appendElement("br");
        p.tagName("div");
    }

    // Short quotes
    for (Element q : document.select("q")) {
        q.prependText("\"");
        q.appendText("\"");
        q.tagName("em");
    }

    // Pre formatted text
    for (Element pre : document.select("pre")) {
        pre.html(formatPre(pre.wholeText()));
        pre.tagName("tt");
    }

    // Code
    document.select("code").tagName("strong");

    // Lines
    for (Element hr : document.select("hr")) {
        hr.tagName("div");
        hr.text("----------------------------------------");
    }

    // Descriptions
    document.select("dl").tagName("div");
    for (Element dt : document.select("dt")) {
        dt.tagName("strong");
        dt.appendElement("br");
    }
    for (Element dd : document.select("dd")) {
        dd.tagName("em");
        dd.appendElement("br").appendElement("br");
    }

    // Abbreviations
    document.select("abbr").tagName("u");

    // Subscript/Superscript
    for (Element subp : document.select("sub,sup")) {
        Element small = document.createElement("small");
        small.html(subp.html());
        subp.html(small.outerHtml());
    }

    // Lists
    for (Element li : document.select("li")) {
        li.tagName("span");
        li.prependText("* ");
        li.appendElement("br"); // line break after list item
    }
    document.select("ol").tagName("div");
    document.select("ul").tagName("div");

    // Tables
    for (Element col : document.select("th,td")) {
        // separate columns
        if (hasVisibleContent(col.childNodes()))
            if (col.nextElementSibling() != null)
                col.appendText(" ");

        if ("th".equals(col.tagName()))
            col.tagName("strong");
        else
            col.tagName("span");
    }

    for (Element row : document.select("tr")) {
        row.tagName("span");
        if (hasVisibleContent(row.childNodes())) {
            Element next = row.nextElementSibling();
            if (next != null && "tr".equals(next.tagName()))
                row.appendElement("br");
        }
    }

    document.select("caption").tagName("div");

    for (Element table : document.select("table"))
        if (table.parent() != null && "a".equals(table.parent().tagName()))
            table.tagName("span"); // Links cannot contain tables
        else
            table.tagName("div");

    // Remove tracking pixels
    if (disable_tracking)
        removeTrackingPixels(context, document);

    // Images
    for (Element img : document.select("img")) {
        String alt = img.attr("alt");
        String src = img.attr("src");
        String tracking = img.attr("tracking");

        // Show the alternative text, linked to the original source for tracking pixels
        if (!show_images && !TextUtils.isEmpty(alt)) {
            if (TextUtils.isEmpty(tracking))
                img.appendText(" " + alt + " ");
            else {
                img.append(" ");
                Element a = document.createElement("a");
                a.attr("href", tracking);
                a.text(alt);
                img.appendChild(a);
                img.appendText(" ");
            }
        }

        // Annotate source with width and height
        if (!TextUtils.isEmpty(src)) {
            // Only the leading digits of the attributes are used
            int width = 0;
            int height = 0;

            String awidth = img.attr("width");
            for (int i = 0; i < awidth.length(); i++)
                if (Character.isDigit(awidth.charAt(i)))
                    width = width * 10 + (byte) awidth.charAt(i) - (byte) '0';
                else
                    break;

            String aheight = img.attr("height");
            for (int i = 0; i < aheight.length(); i++)
                if (Character.isDigit(aheight.charAt(i)))
                    height = height * 10 + (byte) aheight.charAt(i) - (byte) '0';
                else
                    break;

            if (width != 0 || height != 0) {
                ImageHelper.AnnotatedSource a = new ImageHelper.AnnotatedSource(
                        src, width, height, !TextUtils.isEmpty(tracking));
                img.attr("src", a.getAnnotated());
            }
        }
    }

    // Autolink
    if (autolink) {
        final Pattern pattern = Pattern.compile(
                PatternsCompat.AUTOLINK_EMAIL_ADDRESS.pattern() + "|" +
                        PatternsCompat.AUTOLINK_WEB_URL.pattern());

        NodeTraversor.traverse(new NodeVisitor() {
            private int links = 0;

            @Override
            public void head(Node node, int depth) {
                if (links < MAX_AUTO_LINK && node instanceof TextNode) {
                    TextNode tnode = (TextNode) node;
                    String text = tnode.getWholeText();

                    Matcher matcher = pattern.matcher(text);
                    if (matcher.find()) {
                        // The span replaces the text node and holds text and links
                        Element span = document.createElement("span");

                        int pos = 0;
                        do {
                            // Text that is already inside a link is kept as is
                            boolean linked = false;
                            Node parent = tnode.parent();
                            while (parent != null) {
                                if ("a".equals(parent.nodeName())) {
                                    linked = true;
                                    break;
                                }
                                parent = parent.parent();
                            }

                            boolean email = matcher.group().contains("@") && !matcher.group().contains(":");
                            Log.d("Web url=" + matcher.group() +
                                    " " + matcher.start() + "..." + matcher.end() + "/" + text.length() +
                                    " linked=" + linked + " email=" + email + " count=" + links);

                            if (linked)
                                span.appendText(text.substring(pos, matcher.end()));
                            else {
                                span.appendText(text.substring(pos, matcher.start()));

                                Element a = document.createElement("a");
                                a.attr("href", (email ? "mailto:" : "") + matcher.group());
                                a.text(matcher.group());
                                span.appendChild(a);

                                links++;
                            }

                            pos = matcher.end();
                        } while (links < MAX_AUTO_LINK && matcher.find());

                        span.appendText(text.substring(pos));

                        tnode.before(span);
                        tnode.text("");
                    }
                }
            }

            @Override
            public void tail(Node node, int depth) {
            }
        }, document);
    }

    // Selective new lines
    for (Element div : document.select("div"))
        if (!Boolean.parseBoolean(div.attr("inline")) &&
                div.children().select("div").size() == 0 &&
                hasVisibleContent(div.childNodes())) {
            div.appendElement("br");
        }

    for (Element div : document.select("div"))
        div.tagName("span");

    // Before Android N the color attribute set by the style pass is used via font elements
    if (Build.VERSION.SDK_INT < Build.VERSION_CODES.N)
        for (Element span : document.select("span"))
            if (!TextUtils.isEmpty(span.attr("color")))
                span.tagName("font");

    if (document.body() == null) {
        Log.e("Sanitize without body");
        document.normalise();
    }

    return document;
}
/**
 * Tells whether any of the given nodes contributes visible content.
 * <p>
 * A node counts as visible when it is a non blank text node, or a non block
 * element that has text or contains an image. Block elements are not inspected.
 *
 * @param nodes the nodes to inspect, typically the child nodes of an element
 * @return true when at least one node is visible
 */
private static boolean hasVisibleContent(List<Node> nodes) {
    for (Node node : nodes) {
        if (node instanceof TextNode) {
            if (!((TextNode) node).isBlank())
                return true;
        } else if (node instanceof Element) {
            Element element = (Element) node;
            if (!element.isBlock() &&
                    (element.hasText() || element.selectFirst("img") != null))
                return true;
        }
    }
    return false;
}
static String formatPre(String text) {
int level = 0;
StringBuilder sb = new StringBuilder();
String[] lines = text.split("\\r?\\n");
for (String line : lines) {
// Opening quotes
int tlevel = 0;
while (line.startsWith(">")) {
tlevel++;
if (tlevel > level)
sb.append("");
line = line.substring(1); // >
if (line.startsWith(" "))
line = line.substring(1);
}
// Closing quotes
for (int i = 0; i < level - tlevel; i++)
sb.append("
");
level = tlevel;
// Tabs characters
StringBuilder l = new StringBuilder();
for (int j = 0; j < line.length(); j++) {
char kar = line.charAt(j);
if (kar == '\t') {
l.append(' ');
while (l.length() % TAB_SIZE != 0)
l.append(' ');
} else
l.append(kar);
}
line = l.toString();
// Html characters
line = Html.escapeHtml(line);
// Space characters
int len = line.length();
for (int j = 0; j < len; j++) {
char kar = line.charAt(j);
if (kar == ' ') {
// Prevent trimming start
// Keep one space for word wrapping
if (j == 0 || (j + 1 < len && line.charAt(j + 1) == ' '))
sb.append(" ");
else
sb.append(' ');
} else
sb.append(kar);
}
sb.append("
");
}
// Closing quotes
for (int i = 0; i < level; i++)
sb.append("");
return sb.toString();
}
/**
 * Replaces images that look like tracking pixels by a placeholder icon.
 * <p>
 * Hosts that also serve an image that is not a tracking pixel are considered
 * allowed; tracking pixels from those hosts are left alone. A replaced image
 * gets the placeholder as source, a fixed size of 24x24, a descriptive alt text
 * and a "tracking" attribute holding the original source.
 *
 * @param context  context used to resolve the icon, its tint and the alt text
 * @param document the document to modify in place
 */
static void removeTrackingPixels(Context context, Document document) {
    // Build list of allowed hosts
    List<String> hosts = new ArrayList<>();
    for (Element img : document.select("img")) {
        String src = img.attr("src");
        if (!TextUtils.isEmpty(src) && !isTrackingPixel(img)) {
            String host = Uri.parse(src).getHost();
            if (host != null && !hosts.contains(host))
                hosts.add(host);
        }
    }

    // Images
    String placeholder = null; // rendered on first use only
    for (Element img : document.select("img")) {
        img.removeAttr("tracking");
        String src = img.attr("src");
        if (!TextUtils.isEmpty(src) && isTrackingPixel(img)) {
            String host = Uri.parse(src).getHost();
            if (host == null || !hosts.contains(host)) {
                if (placeholder == null)
                    placeholder = getTrackingPixelPlaceholder(context);

                img.attr("src", placeholder);
                img.attr("alt", context.getString(R.string.title_legend_tracking_pixel));
                img.attr("height", "24");
                img.attr("width", "24");
                img.attr("style", "display:block !important; width:24px !important; height:24px !important;");
                img.attr("tracking", src);
            }
        }
    }
}

// Renders the tinted tracking pixel icon into a PNG and returns it as a data URI
private static String getTrackingPixelPlaceholder(Context context) {
    Drawable d = ContextCompat.getDrawable(context, R.drawable.baseline_my_location_24);
    d.setTint(Helper.resolveColor(context, R.attr.colorWarning));

    Bitmap bm = Bitmap.createBitmap(d.getIntrinsicWidth(), d.getIntrinsicHeight(), Bitmap.Config.ARGB_8888);
    Canvas c = new Canvas(bm);
    d.setBounds(0, 0, c.getWidth(), c.getHeight());
    d.draw(c);

    ByteArrayOutputStream bos = new ByteArrayOutputStream();
    bm.compress(Bitmap.CompressFormat.PNG, 100, bos);

    StringBuilder sb = new StringBuilder();
    sb.append("data:image/png;base64,");
    sb.append(Base64.encodeToString(bos.toByteArray(), Base64.NO_WRAP));
    return sb.toString();
}
/**
 * Tells whether an image is small enough to be considered a tracking pixel.
 * <p>
 * Both the width and height attributes need to be present and to be plain
 * integers; the image is a tracking pixel when width times height is at most
 * {@code TRACKING_PIXEL_SURFACE}.
 *
 * @param img the image element
 * @return true for a tracking pixel, false otherwise or when the size is unknown
 */
private static boolean isTrackingPixel(Element img) {
    String width = img.attr("width").trim();
    String height = img.attr("height").trim();

    if (TextUtils.isEmpty(width) || TextUtils.isEmpty(height))
        return false;

    try {
        // Multiply as long: the int product of large sizes can wrap around to a small value
        long surface = (long) Integer.parseInt(width) * Integer.parseInt(height);
        return (surface <= TRACKING_PIXEL_SURFACE);
    } catch (NumberFormatException ignored) {
        // Sizes like "100%" or "1px" are not tracking pixel sizes
        return false;
    }
}
/**
 * Replaces {@code cid:} image sources by data URIs holding the attachment content.
 * <p>
 * Images for which no available attachment is found are left unchanged.
 *
 * @param context  context used to access the database and the attachment files
 * @param id       identifier passed to the attachment lookup together with the content id
 * @param document the document to modify in place
 * @throws IOException when an attachment file cannot be read completely
 */
static void embedInlineImages(Context context, long id, Document document) throws IOException {
    DB db = DB.getInstance(context);
    for (Element img : document.select("img")) {
        String src = img.attr("src");
        if (src.startsWith("cid:")) {
            String cid = '<' + src.substring(4) + '>';
            EntityAttachment attachment = db.attachment().getAttachment(id, cid);
            if (attachment != null && attachment.available) {
                File file = attachment.getFile(context);
                try (InputStream is = new FileInputStream(file)) {
                    byte[] bytes = new byte[(int) file.length()];

                    // A single read is allowed to return less than requested
                    int offset = 0;
                    while (offset < bytes.length) {
                        int count = is.read(bytes, offset, bytes.length - offset);
                        if (count < 0)
                            throw new IOException("length");
                        offset += count;
                    }

                    StringBuilder sb = new StringBuilder();
                    sb.append("data:");
                    sb.append(attachment.type);
                    sb.append(";base64,");
                    sb.append(Base64.encodeToString(bytes, Base64.NO_WRAP));

                    img.attr("src", sb.toString());
                }
            }
        }
    }
}
/**
 * Makes sure the document head starts with a single viewport meta element
 * that sets the width to the device width and the initial scale to 1.0.
 * Existing viewport meta elements in the head are removed first.
 *
 * @param document the document to modify in place
 */
static void setViewport(Document document) {
    // https://developer.mozilla.org/en-US/docs/Mozilla/Mobile/Viewport_meta_tag
    Element head = document.head();
    head.select("meta").select("[name=viewport]").remove();

    Element viewport = document.createElement("meta");
    viewport.attr("name", "viewport");
    viewport.attr("content", "width=device-width, initial-scale=1.0");
    head.prependChild(viewport);

    Log.i(document.head().html());
}
/**
 * Returns a short plain text preview of an HTML body, see {@link #_getPreview}.
 * Running out of memory is logged and results in null.
 *
 * @param body the HTML body, may be null
 * @return the preview, or null when there is no body or no memory
 */
static String getPreview(String body) {
    String preview = null;
    try {
        preview = _getPreview(body);
    } catch (OutOfMemoryError ex) {
        Log.e(ex);
    }
    return preview;
}
/**
 * Extracts the text of an HTML body and limits it to {@code PREVIEW_SIZE}
 * characters, followed by an ellipsis when text was cut off.
 *
 * @param body the HTML body, may be null
 * @return the preview, or null when {@code body} is null
 */
private static String _getPreview(String body) {
    if (body == null)
        return null;

    String text = JsoupEx.parse(body).text();

    int end = Math.min(text.length(), PREVIEW_SIZE);
    // Do not cut a surrogate pair in half, this would leave an invalid character
    if (end > 0 && end < text.length() &&
            Character.isHighSurrogate(text.charAt(end - 1)))
        end--;

    String preview = text.substring(0, end);
    if (preview.length() < text.length())
        preview += "…";

    return preview;
}
static String getText(String html) {
final StringBuilder sb = new StringBuilder();
html = html.replace("
", "
");
NodeTraversor.traverse(new NodeVisitor() {
private int qlevel = 0;
private int tlevel = 0;
private int plevel = 0;
private int lindex = 0;
public void head(Node node, int depth) {
if (node instanceof TextNode)
if (plevel > 0) {
String[] lines = ((TextNode) node).getWholeText().split("\\r?\\n");
for (String line : lines) {
append(line, true);
newline();
}
} else
append(((TextNode) node).text());
else {
String name = node.nodeName();
if ("li".equals(name))
append("*");
else if ("blockquote".equals(name))
qlevel++;
else if ("pre".equals(name))
plevel++;
if (heads.contains(name))
newline();
}
}
public void tail(Node node, int depth) {
String name = node.nodeName();
if ("a".equals(name))
append("[" + node.attr("href") + "]");
else if ("img".equals(name))
append("[" + node.attr("src") + "]");
else if ("th".equals(name) || "td".equals(name)) {
Node next = node.nextSibling();
if (next == null || !("th".equals(next.nodeName()) || "td".equals(next.nodeName())))
newline();
else
append(" ");
} else if ("blockquote".equals(name))
qlevel--;
else if ("pre".equals(name))
plevel--;
if (tails.contains(name))
newline();
}
private void append(String text) {
append(text, false);
}
private void append(String text, boolean raw) {
if (tlevel != qlevel) {
newline();
tlevel = qlevel;
}
if (!raw && !"-- ".equals(text)) {
text = text.trim();
if (lindex > 0)
text = " " + text;
}
sb.append(text);
lindex += text.length();
}
private void newline() {
lindex = 0;
sb.append("\n");
for (int i = 0; i < qlevel; i++)
sb.append("> ");
}
}, JsoupEx.parse(html));
sb.append("\n");
return sb.toString();
}
/**
 * Colors the names of message headers with the accent color.
 * <p>
 * For every line that does not start with whitespace, the part before the
 * first colon is colored, provided the colon is not the first character.
 * Lines starting with whitespace and empty lines are left uncolored.
 *
 * @param context context used to resolve the accent color
 * @param headers the headers, lines separated by a new line character
 * @return the headers with color spans applied
 */
static Spanned highlightHeaders(Context context, String headers) {
    final int accent = Helper.resolveColor(context, R.attr.colorAccent);
    final SpannableStringBuilder result = new SpannableStringBuilder(headers);

    int offset = 0; // position of the current line within headers
    for (String header : headers.split("\n")) {
        boolean skip = (header.length() == 0 || Character.isWhitespace(header.charAt(0)));
        if (!skip) {
            int separator = header.indexOf(':');
            if (separator > 0)
                result.setSpan(new ForegroundColorSpan(accent), offset, offset + separator, 0);
        }
        // Account for the new line character removed by split
        offset += header.length() + 1;
    }

    return result;
}
/**
 * Converts HTML into styled text without image getter and tag handler.
 *
 * @param html the HTML to convert
 * @return the styled text
 */
static Spanned fromHtml(@NonNull String html) {
    return fromHtml(html, null, null);
}

/**
 * Converts HTML into styled text and reduces a run of new lines at the very
 * end of the result to a single new line.
 *
 * @param html        the HTML to convert
 * @param imageGetter optional image getter passed on to the conversion
 * @param tagHandler  optional tag handler passed on to the conversion
 * @return the styled text
 */
static Spanned fromHtml(@NonNull String html, @Nullable Html.ImageGetter imageGetter, @Nullable Html.TagHandler tagHandler) {
    Spanned result = HtmlCompat.fromHtml(html, FROM_HTML_SEPARATOR_LINE_BREAK_LIST_ITEM, imageGetter, tagHandler);

    final int length = result.length();
    int end = length;
    // Step back as long as the text would still end with two new lines
    while (end >= 2 && result.charAt(end - 1) == '\n' && result.charAt(end - 2) == '\n')
        end--;

    if (end == length)
        return result;
    return (Spanned) result.subSequence(0, end);
}
/**
 * Converts styled text into HTML.
 * <p>
 * Spans whose style starts with a relative font size in {@code em} are
 * rewritten into {@code small} (size below 1.0) or {@code big} elements and
 * lose their style attribute, so the size survives a later conversion back.
 *
 * @param spanned the styled text
 * @return the HTML of the complete document
 */
static String toHtml(Spanned spanned) {
    // @Google: why convert size to and from in a different way?
    Document doc = JsoupEx.parse(HtmlCompat.toHtml(spanned, TO_HTML_PARAGRAPH_LINES_CONSECUTIVE));

    for (Element span : doc.select("span")) {
        String style = span.attr("style");
        if (!style.startsWith("font-size:"))
            continue;

        int start = style.indexOf(':');
        int end = style.indexOf("em;", start);
        if (end <= start)
            continue;

        try {
            // The size can be formatted with a decimal comma
            String number = style.substring(start + 1, end).replace(',', '.');
            float size = Float.parseFloat(number);
            span.tagName(size < 1.0f ? "small" : "big");
            span.attributes().remove("style");
        } catch (NumberFormatException ex) {
            Log.e(ex);
        }
    }

    return doc.html();
}
}