Merge pull request #1838 from thelounge/xpaw/ogp-media

Try to find og:video and og:audio on html pages
This commit is contained in:
Jérémie Astori 2018-03-07 19:22:30 -05:00 committed by GitHub
commit 589d7a9811
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 114 additions and 42 deletions

View File

@ -1449,6 +1449,11 @@ button.collapse-network:first-child:nth-last-child(3) {
max-width: 100%;
}
#chat video {
max-width: 640px;
max-height: 240px;
}
/* Do not display an empty div when there are no previews. Useful for example in
part/quit messages where we don't load previews (adds a blank line otherwise) */
#chat .preview:empty {

View File

@ -7,13 +7,13 @@
{{/equal}}
{{#equal type "audio"}}
<audio controls preload="metadata">
<source src="{{link}}" type="{{res}}">
<source src="{{media}}" type="{{mediaType}}">
Your browser does not support the audio element.
</audio>
{{/equal}}
{{#equal type "video"}}
<video width="320" height="240" preload="metadata" controls>
<source src="{{link}}" type="{{res}}">
<video preload="metadata" controls>
<source src="{{media}}" type="{{mediaType}}">
Your browser does not support the video element.
</video>
{{/equal}}

View File

@ -9,6 +9,9 @@ const cleanIrcMessage = require("../../../client/js/libs/handlebars/ircmessagepa
const findLinks = require("../../../client/js/libs/handlebars/ircmessageparser/findLinks");
const storage = require("../storage");
const mediaTypeRegex = /^(audio|video)\/.+/;
const linkRegex = /^https?:\/\//;
// Fix ECDH curve client compatibility in Node v8/v9
// This is fixed in Node 10, but The Lounge supports LTS versions
// https://github.com/nodejs/node/issues/16196
@ -30,7 +33,7 @@ module.exports = function(client, chan, msg) {
const cleanText = cleanIrcMessage(msg.text);
// We will only try to prefetch http(s) links
const links = findLinks(cleanText).filter((w) => /^https?:\/\//.test(w.link));
const links = findLinks(cleanText).filter((w) => linkRegex.test(w.link));
if (links.length === 0) {
return;
@ -65,10 +68,13 @@ module.exports = function(client, chan, msg) {
});
};
function parse(msg, preview, res, client) {
switch (res.type) {
case "text/html": {
function parseHtml(preview, res, client) {
return new Promise((resolve) => {
const $ = cheerio.load(res.data);
return parseHtmlMedia($, preview, res, client)
.then((newRes) => resolve(newRes))
.catch(() => {
preview.type = "link";
preview.head =
$('meta[property="og:title"]').attr("content")
@ -89,7 +95,7 @@ function parse(msg, preview, res, client) {
}
// Make sure thumbnail is a valid url
if (!/^https?:\/\//.test(preview.thumb)) {
if (!linkRegex.test(preview.thumb)) {
preview.thumb = "";
}
@ -102,15 +108,69 @@ function parse(msg, preview, res, client) {
preview.thumb = "";
}
handlePreview(client, msg, preview, resThumb);
resolve(resThumb);
});
} else {
resolve(res);
}
});
});
}
/**
 * Searches a parsed HTML page for OpenGraph video/audio metadata and, when a
 * usable media URL is found, fetches it and turns `preview` into a media preview.
 *
 * "video" is tried before "audio"; within a type, the first
 * `og:<type>:type` tag whose content matches `mediaTypeRegex` and whose
 * same-index `og:<type>` tag holds an https:// URL is used.
 *
 * @param {Function} $ - cheerio instance loaded with the page's HTML
 * @param {Object} preview - preview object; on success its `type`, `media` and
 *   `mediaType` properties are overwritten
 * @param {Object} res - response for the HTML page (not read by this function)
 * @param {Object} client - client whose `language` is forwarded to `fetch`
 * @returns {Promise} resolves with the fetched media response; rejects without
 *   a reason when no candidate is found, or when the fetched resource is
 *   missing or is not audio/video
 */
function parseHtmlMedia($, preview, res, client) {
	return new Promise((resolve, reject) => {
		let foundMedia = false;

		["video", "audio"].forEach((type) => {
			// A candidate for an earlier type is already being fetched
			if (foundMedia) {
				return;
			}

			// Regular function (not arrow) because cheerio binds `this` to the current element
			$(`meta[property="og:${type}:type"]`).each(function(i) {
				const mimeType = $(this).attr("content");

				if (!mediaTypeRegex.test(mimeType)) {
					return;
				}

				// If we match a clean video or audio tag, parse that as a preview instead.
				// The url tag is paired with the type tag by position.
				const mediaUrl = $($(`meta[property="og:${type}"]`).get(i)).attr("content");

				// Make sure media is a valid url. A type tag without a url tag at the
				// same index yields undefined; skip it and keep looking instead of throwing.
				if (typeof mediaUrl !== "string" || !mediaUrl.startsWith("https://")) {
					return;
				}

				foundMedia = true;

				fetch(escapeHeader(mediaUrl), {language: client.language}, (resMedia) => {
					// The page's metadata is not trusted: the fetched resource itself
					// must also report an audio/video type
					if (resMedia === null || !mediaTypeRegex.test(resMedia.type)) {
						return reject();
					}

					preview.type = type;
					preview.media = mediaUrl;
					preview.mediaType = resMedia.type;

					resolve(resMedia);
				});

				// Returning false stops the .each() iteration
				return false;
			});
		});

		if (!foundMedia) {
			reject();
		}
	});
}
function parse(msg, preview, res, client) {
let promise;
switch (res.type) {
case "text/html":
promise = parseHtml(preview, res, client);
break;
case "image/png":
case "image/gif":
case "image/jpg":
@ -141,7 +201,8 @@ function parse(msg, preview, res, client) {
}
preview.type = "audio";
preview.res = res.type;
preview.media = preview.link;
preview.mediaType = res.type;
break;
@ -152,8 +213,9 @@ function parse(msg, preview, res, client) {
break;
}
preview.res = res.type;
preview.type = "video";
preview.media = preview.link;
preview.mediaType = res.type;
break;
@ -161,7 +223,11 @@ function parse(msg, preview, res, client) {
return;
}
handlePreview(client, msg, preview, res);
if (!promise) {
return handlePreview(client, msg, preview, res);
}
promise.then((newRes) => handlePreview(client, msg, preview, newRes));
}
function handlePreview(client, msg, preview, res) {
@ -248,8 +314,9 @@ function fetch(uri, {language}, cb) {
if (contentLength > limit) {
req.abort();
}
} else if (/^(audio|video)\/.+/.test(res.headers["content-type"])) {
req.abort(); // ensure server doesn't download the audio file
} else if (mediaTypeRegex.test(res.headers["content-type"])) {
// We don't need to download the file any further after we received content-type header
req.abort();
} else {
// if not image, limit download to 50kb, since we need only meta tags
// twitter.com sends opengraph meta tags within ~20kb of data for individual tweets