2016-10-09 19:14:02 +00:00
|
|
|
"use strict";
|
|
|
|
|
2016-12-09 20:46:53 +00:00
|
|
|
const cheerio = require("cheerio");
|
|
|
|
const Msg = require("../../models/msg");
|
|
|
|
const request = require("request");
|
|
|
|
const Helper = require("../../helper");
|
|
|
|
const es = require("event-stream");
|
2014-09-27 19:17:05 +00:00
|
|
|
|
2015-04-29 19:55:13 +00:00
|
|
|
process.setMaxListeners(0);
|
|
|
|
|
2016-12-09 20:46:53 +00:00
|
|
|
module.exports = function(client, chan, originalMsg) {
|
|
|
|
if (!Helper.config.prefetch) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const links = originalMsg.text
|
|
|
|
.replace(/\x02|\x1D|\x1F|\x16|\x0F|\x03(?:[0-9]{1,2}(?:,[0-9]{1,2})?)?/g, "")
|
|
|
|
.split(" ")
|
2017-04-08 12:34:31 +00:00
|
|
|
.filter((w) => /^https?:\/\//.test(w));
|
2016-12-09 20:46:53 +00:00
|
|
|
|
|
|
|
if (links.length === 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2017-04-08 12:34:31 +00:00
|
|
|
const msg = new Msg({
|
2016-12-09 20:46:53 +00:00
|
|
|
type: Msg.Type.TOGGLE,
|
|
|
|
time: originalMsg.time,
|
|
|
|
self: originalMsg.self,
|
|
|
|
});
|
|
|
|
chan.pushMessage(client, msg);
|
|
|
|
|
|
|
|
const link = escapeHeader(links[0]);
|
|
|
|
fetch(link, function(res) {
|
|
|
|
parse(msg, link, res, client);
|
2014-09-27 19:17:05 +00:00
|
|
|
});
|
|
|
|
};
|
|
|
|
|
2014-09-27 23:47:04 +00:00
|
|
|
function parse(msg, url, res, client) {
|
|
|
|
var toggle = msg.toggle = {
|
|
|
|
id: msg.id,
|
|
|
|
type: "",
|
|
|
|
head: "",
|
|
|
|
body: "",
|
2014-10-12 01:42:30 +00:00
|
|
|
thumb: "",
|
2016-11-25 17:57:47 +00:00
|
|
|
link: url,
|
2014-09-27 23:47:04 +00:00
|
|
|
};
|
|
|
|
|
2014-09-27 19:17:05 +00:00
|
|
|
switch (res.type) {
|
|
|
|
case "text/html":
|
2014-12-21 23:26:55 +00:00
|
|
|
var $ = cheerio.load(res.text);
|
2014-09-27 23:47:04 +00:00
|
|
|
toggle.type = "link";
|
|
|
|
toggle.head = $("title").text();
|
2014-10-14 18:51:27 +00:00
|
|
|
toggle.body =
|
2015-09-30 22:39:57 +00:00
|
|
|
$("meta[name=description]").attr("content")
|
|
|
|
|| $("meta[property=\"og:description\"]").attr("content")
|
2014-10-14 18:51:27 +00:00
|
|
|
|| "No description found.";
|
2014-12-11 23:48:43 +00:00
|
|
|
toggle.thumb =
|
2015-09-30 22:39:57 +00:00
|
|
|
$("meta[property=\"og:image\"]").attr("content")
|
|
|
|
|| $("meta[name=\"twitter:image:src\"]").attr("content")
|
2014-10-14 18:51:27 +00:00
|
|
|
|| "";
|
2014-09-27 19:17:05 +00:00
|
|
|
break;
|
|
|
|
|
|
|
|
case "image/png":
|
|
|
|
case "image/gif":
|
|
|
|
case "image/jpg":
|
|
|
|
case "image/jpeg":
|
2016-06-08 09:26:24 +00:00
|
|
|
if (res.size < (Helper.config.prefetchMaxImageSize * 1024)) {
|
2015-09-30 22:15:53 +00:00
|
|
|
toggle.type = "image";
|
2016-05-01 09:41:17 +00:00
|
|
|
} else {
|
2015-09-30 22:15:53 +00:00
|
|
|
return;
|
|
|
|
}
|
2014-09-27 19:17:05 +00:00
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return;
|
|
|
|
}
|
2014-09-27 23:47:04 +00:00
|
|
|
|
|
|
|
client.emit("toggle", toggle);
|
2014-09-27 19:17:05 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
function fetch(url, cb) {
|
2016-10-09 08:54:44 +00:00
|
|
|
let req;
|
2015-01-04 02:58:12 +00:00
|
|
|
try {
|
2016-10-09 08:54:44 +00:00
|
|
|
req = request.get({
|
2016-01-24 10:43:00 +00:00
|
|
|
url: url,
|
2016-03-25 09:45:39 +00:00
|
|
|
maxRedirects: 5,
|
|
|
|
timeout: 5000,
|
2016-01-24 10:43:00 +00:00
|
|
|
headers: {
|
2016-02-10 05:45:21 +00:00
|
|
|
"User-Agent": "Mozilla/5.0 (compatible; The Lounge IRC Client; +https://github.com/thelounge/lounge)"
|
2016-01-24 10:43:00 +00:00
|
|
|
}
|
|
|
|
});
|
2015-09-30 22:39:57 +00:00
|
|
|
} catch (e) {
|
2015-01-04 02:58:12 +00:00
|
|
|
return;
|
|
|
|
}
|
2014-12-21 23:26:55 +00:00
|
|
|
var length = 0;
|
2017-06-21 05:51:14 +00:00
|
|
|
var limit = Helper.config.prefetchMaxImageSize * 1024;
|
2014-12-23 01:06:11 +00:00
|
|
|
req
|
2015-09-30 22:39:57 +00:00
|
|
|
.on("response", function(res) {
|
2017-06-21 05:51:14 +00:00
|
|
|
if (!(/(image\/.+)/.test(res.headers["content-type"]))) {
|
|
|
|
// if not image, limit download to 10kb, since we need only meta tags
|
|
|
|
limit = 1024 * 10;
|
2014-12-23 01:06:11 +00:00
|
|
|
}
|
|
|
|
})
|
2015-09-30 22:39:57 +00:00
|
|
|
.on("error", function() {})
|
2014-12-23 01:06:11 +00:00
|
|
|
.pipe(es.map(function(data, next) {
|
|
|
|
length += data.length;
|
|
|
|
if (length > limit) {
|
|
|
|
req.response.req.abort();
|
|
|
|
}
|
|
|
|
next(null, data);
|
|
|
|
}))
|
|
|
|
.pipe(es.wait(function(err, data) {
|
2016-05-01 09:41:17 +00:00
|
|
|
if (err) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2017-06-21 05:51:14 +00:00
|
|
|
let type;
|
|
|
|
let size = parseInt(req.response.headers["content-length"], 10) || length;
|
|
|
|
|
|
|
|
if (size < length) {
|
|
|
|
size = length;
|
2014-12-23 01:06:11 +00:00
|
|
|
}
|
2017-06-21 05:51:14 +00:00
|
|
|
|
2015-01-03 09:03:43 +00:00
|
|
|
try {
|
2015-09-30 22:39:57 +00:00
|
|
|
type = req.response.headers["content-type"].split(/ *; */).shift();
|
|
|
|
} catch (e) {
|
2015-01-03 09:03:43 +00:00
|
|
|
type = {};
|
|
|
|
}
|
2014-12-23 01:06:11 +00:00
|
|
|
data = {
|
|
|
|
text: data,
|
2015-09-30 22:15:53 +00:00
|
|
|
type: type,
|
|
|
|
size: size
|
2014-12-23 01:06:11 +00:00
|
|
|
};
|
|
|
|
cb(data);
|
|
|
|
}));
|
2014-09-27 19:17:05 +00:00
|
|
|
}
|
2016-03-25 09:45:39 +00:00
|
|
|
|
|
|
|
// https://github.com/request/request/issues/2120
|
|
|
|
// https://github.com/nodejs/node/issues/1693
|
|
|
|
// https://github.com/alexeyten/descript/commit/50ee540b30188324198176e445330294922665fc
|
|
|
|
function escapeHeader(header) {
|
|
|
|
return header
|
|
|
|
.replace(/([\uD800-\uDBFF][\uDC00-\uDFFF])+/g, encodeURI)
|
|
|
|
.replace(/[\uD800-\uDFFF]/g, "")
|
|
|
|
.replace(/[\u0000-\u001F\u007F-\uFFFF]+/g, encodeURI);
|
|
|
|
}
|