Nhờ câu trả lời của Corey ở trên và một ngày thứ bảy lười biếng có quá nhiều thời gian rảnh, giờ đây tôi có thể xem danh sách các thông báo Chrome gần đây ngay trong console của IDE, nơi tôi thậm chí còn có thể nhấp vào các URL.
Mã này khá tệ và dùng các heuristic thô sơ, vì tôi hoàn toàn không biết cách đúng để diễn giải dữ liệu nhị phân.
Nhưng như vậy vẫn tốt hơn rất nhiều so với không có gì. Ví dụ đầu ra (trích đoạn):
https://www.finanzen.net/nachricht/aktien/kw-9-tops-und-flops-der-tecdax-aktien-in-der-vergangenen-woche-7195100
https://images.finanzen.net/mediacenter/unsortiert/TecDAX_boerse_frankfurt0016_kl.jpg
So bewegten sich die Einzelwerte des TecDAX in der zurückliegenden Handelswoche.*
KW 9: Tops und Flops der TecDAX-Aktien in der vergangenen Woche
So bewegten sich die Einzelwerte des TecDAX in der zurückliegenden Handelswoche.
HideOnTheseRoutes
Home/Index;Article/News/Index
tag-7195100
NotificationIdentifier
1061622960{
https://www.youtube.com/watch?v=W-mlD_bYKdU&feature=push-u-sub&attr_tag=0SL8UpnrTOnTECxr%3A6
https://lh5.googleusercontent.com/-raJM5SITO34/AAAAAAAAAAI/AAAAAAAAAAA/UtLljlL4Wpc/s96-c-mo/photo.jpg
New from Market Moves
Trade Recap: $1,500 in PROFITS*˜
COuAyJGY4uACEAY=
attributionTag
0SL8UpnrTOnTECxr:6{
from Market MovesTrade Recap: $1,500 in PROFITS
Đoạn mã Java tệ đến mức đáng bị «đóng đinh»:
import java.io.BufferedInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.charset.Charset;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.function.Consumer;
/**
 * Best-effort reader for Chrome's "Platform Notifications" log file.
 *
 * <p>The file is treated as an opaque byte stream: it is cut into segments at every
 * {@code DATA:} marker, each segment is split into printable tokens, and near-duplicate
 * tokens and segments are discarded. Everything in here is a heuristic; the binary
 * format itself is not parsed.
 *
 * <p>v[1, 2019-03-02 13:00 UTC]
 *
 * <p>by dreamspace-president.com
 */
public final class CrappyChromeNotificationHistoryReader {

    /** Log file read by {@link #main(String[])} when no path is passed on the command line. */
    private static final String DEFAULT_LOG_FILE =
            "C:\\Users\\[YOUR_NAME_HERE]\\AppData\\Local\\Google\\Chrome\\User Data\\Default\\Platform Notifications\\000003.log";

    /**
     * Two lines are only tested for containment when {@code shorterLength / longerLength}
     * is at least this value.
     */
    private static final double MIN_LENGTH_DIFFERENCE_RATIO = 0.7;

    /**
     * A token list is dropped as redundant when the share of its tokens that have no
     * similar counterpart in another token list falls below this value.
     */
    private static final double MIN_REMAININGLINES_PERCENTAGEOF_ALLLINES = 0.2;

    /** Byte sequence that separates two segments in the log file. */
    private static final int[] SEGMENT_MARKER = { 'D', 'A', 'T', 'A', ':' };

    /**
     * Prints every notification found in the log file to {@code System.err}, newest first.
     *
     * @param args optional; {@code args[0]} is the path of the log file. Without it the
     *             hard-coded default path is used.
     */
    public static void main(final String[] args) {
        final String path = (args != null && args.length > 0) ? args[0] : DEFAULT_LOG_FILE;
        final File file = new File(path);
        for (ChromeNotificationStuff notification : obtainChromeNotificationStuff(file)) {
            System.err.println();
            System.err.println(notification);
        }
        System.exit(0);
    }

    /**
     * Reads the given log file and returns one entry per surviving segment.
     *
     * <p>Tokens starting with {@code http://} or {@code https://} end up in
     * {@link ChromeNotificationStuff#urls}, all other tokens in
     * {@link ChromeNotificationStuff#texts}. If the file cannot be read, the stack trace
     * is printed and whatever was parsed so far is returned.
     *
     * @param file the log file to read
     * @return the notifications, sorted so that segments found later in the file come first
     */
    public static List<ChromeNotificationStuff> obtainChromeNotificationStuff(final File file) {
        final List<ChromeNotificationStuff> ret = new ArrayList<>();
        int instanceCounter = 0;
        for (DumbTokenList dtl : doTheInsaneParsingThing(file)) {
            final List<String> urls = new ArrayList<>();
            final List<String> texts = new ArrayList<>();
            for (String token : dtl.tokens) {
                if (token.startsWith("https://") || token.startsWith("http://")) {
                    urls.add(token);
                } else {
                    texts.add(token);
                }
            }
            removePrefixUrls(urls);
            ret.add(new ChromeNotificationStuff(instanceCounter, urls, texts));
            instanceCounter++;
        }
        ret.sort(null); // natural order, see ChromeNotificationStuff#compareTo
        return ret;
    }

    /**
     * Removes URLs that are a prefix of another URL in the list; of two identical URLs
     * the later one is removed. Walks from the back and removes at most one URL per
     * outer step, so the outer index always stays within bounds.
     */
    private static void removePrefixUrls(final List<String> urls) {
        for (int i = urls.size() - 1; i > 0; i--) {
            final String urlThis = urls.get(i);
            for (int ii = i - 1; ii >= 0; ii--) {
                final String urlThat = urls.get(ii);
                if (urlThis.length() > urlThat.length()) {
                    if (urlThis.startsWith(urlThat)) {
                        urls.remove(ii);
                        break;
                    }
                } else if (urlThat.startsWith(urlThis)) {
                    urls.remove(i);
                    break;
                }
            }
        }
    }

    /**
     * The URLs and text lines extracted from one segment of the log file.
     * Natural ordering puts the segment that was found last in the file first.
     */
    public static final class ChromeNotificationStuff implements Comparable<ChromeNotificationStuff> {

        /** Position of the originating segment within the file; only used for ordering. */
        private final int instanceCounter;

        /** Unmodifiable list of the tokens that start with {@code http://} or {@code https://}. */
        public final List<String> urls;

        /** Unmodifiable list of all other tokens. */
        public final List<String> texts;

        private ChromeNotificationStuff(final int instanceCounter,
                                        final List<String> urls,
                                        final List<String> texts) {
            this.instanceCounter = instanceCounter;
            // Copy first: wrapping alone would still let the creator change the public lists later.
            this.urls = Collections.unmodifiableList(new ArrayList<>(urls));
            this.texts = Collections.unmodifiableList(new ArrayList<>(texts));
        }

        /** Returns all URLs followed by all texts, one per line. */
        @Override
        public String toString() {
            final StringBuilder sb = new StringBuilder();
            for (String url : urls) {
                sb.append(url).append('\n');
            }
            for (String text : texts) {
                sb.append(text).append('\n');
            }
            return sb.toString();
        }

        /** Orders by descending instance counter: newest (= last) notifications first. */
        @Override
        public int compareTo(final ChromeNotificationStuff o) {
            return Integer.compare(o.instanceCounter, instanceCounter);
        }
    }

    /** The printable tokens recovered from one segment of text mixed with binary data. */
    private static final class DumbTokenList {

        /** Tokens shorter than this are thrown away. */
        private static final int MIN_LENGTH = 10;

        /** File extensions after which a few trailing junk characters are cut off. */
        private static final String[] EXTENSIONS = { ".jpg", ".jpeg", ".png", ".gif", ".html", ".htm", ".php" };

        /** Maximum number of characters after an extension that are still treated as junk. */
        private static final int MAX_EXTRA_CRAP_AFTER_EXTENSIONS = 3;

        /**
         * Characters that may appear in a URL (https://stackoverflow.com/a/1547940/3500521),
         * plus {@code '%'} so that percent-encoded URLs are not cut at their first escape.
         */
        private static final String SAFE_URL_CHARACTERS =
                "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-._~:/?#[]@!$&'()*+,;=%";

        /** The unprocessed segment text; kept for debugging only. */
        private final String originalText;

        /** Unmodifiable list of the cleaned, de-duplicated tokens in order of appearance. */
        private final List<String> tokens;

        private DumbTokenList(final String textWithBinaryCrap) {
            originalText = textWithBinaryCrap;
            final List<String> found = tokenize(textWithBinaryCrap);
            removeQuasiDuplicates(found);
            tokens = Collections.unmodifiableList(found);
        }

        /**
         * Splits the text at every character below {@code ' '} and at every {@code '"'};
         * the character directly following a {@code '"'} is skipped as well.
         */
        private static List<String> tokenize(final String text) {
            final List<String> out = new ArrayList<>();
            final StringBuilder run = new StringBuilder();
            final int len = text.length();
            int i = 0;
            while (i < len) {
                final char c = text.charAt(i);
                if (c < ' ' || c == '"') {
                    flushRun(run, out);
                    if (c == '"') {
                        i++; // also skip the character after the quote
                    }
                } else {
                    run.append(c);
                }
                i++;
            }
            flushRun(run, out); // whatever is left after the last separator
            return out;
        }

        /**
         * Empties {@code run} into {@code out}, starting a new token at every {@code "http"}
         * that occurs after the first character so that glued-together URLs are separated.
         */
        private static void flushRun(final StringBuilder run, final List<String> out) {
            String rest = run.toString();
            run.setLength(0);
            int httpAt = rest.indexOf("http", 1);
            while (httpAt >= 0) {
                addCleanedTokens(rest.substring(0, httpAt), out);
                rest = rest.substring(httpAt);
                httpAt = rest.indexOf("http", 1);
            }
            addCleanedTokens(rest, out);
        }

        /** Cleans one raw token and appends the usable results (zero, one or two) to {@code out}. */
        private static void addCleanedTokens(final String rawToken, final List<String> out) {
            String token = rawToken;
            if (token.startsWith("ttps://") || token.startsWith("ttp://")) {
                token = "h" + token; // restore a leading 'h' that got lost
            }
            for (String part : splitAtFirstUnsafeUrlCharacter(token)) {
                String cleaned = cutCrapAfterExtension(part);
                final boolean looksLikeUrl = cleaned.startsWith("http");
                if (looksLikeUrl && !cleaned.startsWith("http://") && !cleaned.startsWith("https://")) {
                    continue; // starts with "http" but is not a URL
                }
                if (cleaned.startsWith("/watch?v=")) {
                    cleaned = "https://www.youtube.com" + cleaned;
                }
                if (cleaned.length() >= MIN_LENGTH) {
                    out.add(cleaned);
                }
            }
        }

        /**
         * For a token starting with {@code "http"}: splits it in two at the first character
         * that is not in {@link #SAFE_URL_CHARACTERS}. Any other token, and a URL without
         * such a character, is returned as the only element.
         */
        private static List<String> splitAtFirstUnsafeUrlCharacter(final String token) {
            final List<String> parts = new ArrayList<>(2);
            if (token.startsWith("http")) {
                for (int i = 0; i < token.length(); i++) {
                    if (SAFE_URL_CHARACTERS.indexOf(token.charAt(i)) < 0) {
                        parts.add(token.substring(0, i));
                        parts.add(token.substring(i));
                        return parts;
                    }
                }
            }
            parts.add(token);
            return parts;
        }

        /**
         * Looks at the first occurrence of every known extension and picks the one that
         * starts furthest to the right (the longer one on a tie). If at most
         * {@link #MAX_EXTRA_CRAP_AFTER_EXTENSIONS} characters follow it, they are cut off.
         */
        private static String cutCrapAfterExtension(final String token) {
            int foundExtLen = 0;
            int foundExtAt = -1;
            for (String extension : EXTENSIONS) {
                final int idx = token.indexOf(extension);
                if (idx < 0) {
                    continue;
                }
                final int extLen = extension.length();
                if (idx > foundExtAt || (idx == foundExtAt && extLen > foundExtLen)) {
                    foundExtLen = extLen;
                    foundExtAt = idx;
                }
            }
            if (foundExtAt < 0) {
                return token;
            }
            final int end = foundExtAt + foundExtLen;
            return (token.length() - end <= MAX_EXTRA_CRAP_AFTER_EXTENSIONS) ? token.substring(0, end) : token;
        }

        /**
         * Removes quasi-duplicates as judged by {@link #areLinesTooSimilar(String, String)}.
         * Walks from the back and removes at most one token per outer step, so the outer
         * index always stays within bounds.
         */
        private static void removeQuasiDuplicates(final List<String> tokens) {
            for (int i = tokens.size() - 1; i > 0; i--) { // (not 0 itself, wouldn't make sense)
                final String entry = tokens.get(i);
                for (int ii = i - 1; ii >= 0; ii--) { // (incl. 0)
                    final Boolean verdict = areLinesTooSimilar(entry, tokens.get(ii));
                    if (verdict != null) {
                        // FALSE: drop entry (index i); TRUE: drop the other one (index ii).
                        tokens.remove(verdict ? ii : i);
                        break; // IMPORTANT: indices are stale after a removal
                    }
                }
            }
        }

        /** Returns all tokens, one per line. */
        @Override
        public String toString() {
            final StringBuilder sb = new StringBuilder();
            for (String token : tokens) {
                sb.append(token).append('\n');
            }
            return sb.toString();
        }
    }

    /**
     * Decides whether one of two lines is redundant. Lines count as similar when their
     * length ratio reaches {@link #MIN_LENGTH_DIFFERENCE_RATIO} and the longer one contains
     * the other; the longer (or, for equal lengths, the second) line is the superfluous one.
     *
     * <p>Do NOT call with NULL/EMPTY arguments.
     *
     * @return NULL if not too similar. False if the FIRST seems superfluous. True if the SECOND seems superfluous.
     */
    private static Boolean areLinesTooSimilar(final String line1,
                                              final String line2) {
        final int l1 = line1.length();
        final int l2 = line2.length();
        final double lenDiffRatio = Math.min(l1, l2) / (double) Math.max(l1, l2); // 1 or less
        if (lenDiffRatio < MIN_LENGTH_DIFFERENCE_RATIO) {
            return null;
        }
        if (l2 < l1) {
            return line1.contains(line2) ? Boolean.FALSE : null;
        }
        return line2.contains(line1) ? Boolean.TRUE : null;
    }

    /**
     * Reads the file, turns every segment into a {@link DumbTokenList} and removes the
     * token lists that are mostly covered by another one.
     */
    private static List<DumbTokenList> doTheInsaneParsingThing(final File file) {
        final List<DumbTokenList> ret = readTokenLists(file);
        removeRedundantTokenLists(ret);
        return ret;
    }

    /**
     * Reads the file byte by byte, decodes each byte as Cp1252 and starts a new segment
     * whenever the last five bytes read are {@code DATA:}. On an {@link IOException} the
     * stack trace is printed and the segments completed so far are returned.
     */
    private static List<DumbTokenList> readTokenLists(final File file) {
        final List<DumbTokenList> lists = new ArrayList<>();
        final StringBuilder segment = new StringBuilder();
        try (InputStream is = new BufferedInputStream(new FileInputStream(file))) {
            final Charset charset = Charset.forName("Cp1252"); // =ansi
            final int last = SEGMENT_MARKER.length - 1;
            final int[] window = new int[SEGMENT_MARKER.length]; // the most recent bytes
            while (true) {
                window[last] = is.read();
                final boolean endOfFile = window[last] < 0;
                if (endOfFile || isSegmentMarker(window)) {
                    // NOTE: the marker's "DATA" was appended before the ':' completed it,
                    // so it is still the tail of the segment that ends here.
                    if (segment.length() > 0) {
                        lists.add(new DumbTokenList(segment.toString()));
                        segment.setLength(0);
                    }
                    if (endOfFile) {
                        break;
                    }
                } else {
                    segment.append(new String(new byte[] { (byte) window[last] }, charset));
                }
                // Shift the window to the front; the last slot is overwritten by the next read.
                System.arraycopy(window, 1, window, 0, last);
            }
        } catch (IOException e) {
            // Deliberately best-effort: report the problem and keep what was parsed so far.
            e.printStackTrace();
        }
        return lists;
    }

    /** Returns whether the window holds exactly the bytes of {@link #SEGMENT_MARKER}. */
    private static boolean isSegmentMarker(final int[] window) {
        for (int i = 0; i < SEGMENT_MARKER.length; i++) {
            if (window[i] != SEGMENT_MARKER[i]) {
                return false;
            }
        }
        return true;
    }

    /**
     * Compares every token list with the ones before it. For each pair it counts the
     * tokens on either side that have no similar counterpart; the side with fewer such
     * tokens (the earlier list on a tie) is removed if its share of them is below
     * {@link #MIN_REMAININGLINES_PERCENTAGEOF_ALLLINES}.
     *
     * <p>Each token of the earlier list is counted as covered at most once, so neither
     * count can become negative. A list without tokens yields a NaN share, which is never
     * below the threshold, so such lists are never removed here.
     */
    private static void removeRedundantTokenLists(final List<DumbTokenList> lists) {
        for (int i = lists.size() - 1; i > 0; i--) {
            final DumbTokenList dtlThis = lists.get(i);
            final int thisCount = dtlThis.tokens.size();
            for (int ii = i - 1; ii >= 0; ii--) {
                final DumbTokenList dtlThat = lists.get(ii);
                final int thatCount = dtlThat.tokens.size();
                int remainingThis = thisCount;
                int remainingThat = thatCount;
                final boolean[] thatCovered = new boolean[thatCount];
                for (String tokenThis : dtlThis.tokens) {
                    for (int oo = 0; oo < thatCount; oo++) {
                        if (areLinesTooSimilar(tokenThis, dtlThat.tokens.get(oo)) != null) {
                            remainingThis--;
                            if (!thatCovered[oo]) { // count each counterpart only once
                                thatCovered[oo] = true;
                                remainingThat--;
                            }
                            break;
                        }
                    }
                }
                final double shareThis = remainingThis / (double) thisCount;
                final double shareThat = remainingThat / (double) thatCount;
                if (remainingThis < remainingThat) {
                    if (shareThis < MIN_REMAININGLINES_PERCENTAGEOF_ALLLINES) {
                        lists.remove(i);
                        break; // IMPORTANT: dtlThis is gone
                    }
                } else if (shareThat < MIN_REMAININGLINES_PERCENTAGEOF_ALLLINES) {
                    lists.remove(ii);
                    break; // IMPORTANT: indices are stale; the next outer step re-checks dtlThis
                }
            }
        }
    }
}