mirror of
https://github.com/misskey-dev/summaly.git
synced 2025-05-09 23:57:20 +09:00
116 lines
2.8 KiB
TypeScript
116 lines
2.8 KiB
TypeScript
import * as URL from 'url';
|
|
import * as request from 'request';
|
|
import nullOrEmpty from './utils/null-or-empty';
|
|
import clip from './utils/clip';
|
|
|
|
const escapeRegExp = require('escape-regexp');
|
|
|
|
const Entities = require('html-entities').AllHtmlEntities;
|
|
const entities = new Entities();
|
|
|
|
import * as client from 'cheerio-httpcli';
|
|
// Configure the cheerio-httpcli client imported above before it is used:
// its 'referer' option is set to false and its 'timeout' option to 10000
// (presumably milliseconds — confirm against the cheerio-httpcli docs).
client.set('referer', false);
|
|
client.set('timeout', 10000);
|
|
|
|
import Summary from './summary';
|
|
|
|
/**
 * Builds a summary of a web page (title, icon, description, thumbnail and
 * site name) by fetching it and reading its `<meta>`, `<link>` and `<title>`
 * elements.
 *
 * @param url Parsed URL of the page. `url.href` is fetched and used as the
 *   base for resolving relative image/icon links; `url.hostname` is the
 *   fallback site name.
 * @returns The summary, or `null` when the response is not `text/html`
 *   (including when it has no Content-Type header) or no title value exists.
 * @throws The string `'something happened'` when the fetch result carries an
 *   `error`.
 */
export default async (url: URL.Url): Promise<Summary> => {
	const res = await client.fetch(url.href);

	if (res.error) {
		// NOTE(review): a bare string is thrown here rather than an Error.
		// Kept as-is so callers keep observing the same rejection value.
		throw 'something happened';
	}

	const contentType: string | undefined = res.response.headers['content-type'];

	// Abort if the response is not HTML. A missing Content-Type header is
	// treated the same way instead of crashing on `undefined.indexOf`.
	if (contentType == null || contentType.indexOf('text/html') === -1) {
		return null;
	}

	const $ = res.$;

	let title =
		$('meta[property="og:title"]').attr('content') ||
		$('meta[property="twitter:title"]').attr('content') ||
		$('title').text();

	if (title == null) {
		return null;
	}

	title = clip(entities.decode(title), 100);

	const rawImage =
		$('meta[property="og:image"]').attr('content') ||
		$('meta[property="twitter:image"]').attr('content') ||
		$('link[rel="image_src"]').attr('href') ||
		$('link[rel="apple-touch-icon"]').attr('href') ||
		$('link[rel="apple-touch-icon image_src"]').attr('href');

	// Links may be relative, so resolve them against the page URL.
	const image = rawImage ? URL.resolve(url.href, rawImage) : null;

	const rawDescription =
		$('meta[property="og:description"]').attr('content') ||
		$('meta[property="twitter:description"]').attr('content') ||
		$('meta[name="description"]').attr('content');

	let description = rawDescription
		? clip(entities.decode(rawDescription), 300)
		: null;

	// A description that merely repeats the title carries no information.
	if (title === description) {
		description = null;
	}

	const rawSiteName =
		$('meta[property="og:site_name"]').attr('content') ||
		$('meta[name="application-name"]').attr('content') ||
		url.hostname;

	const siteName = rawSiteName ? entities.decode(rawSiteName) : null;

	let icon =
		$('link[rel="shortcut icon"]').attr('href') ||
		$('link[rel="icon"]').attr('href');

	if (icon == null) {
		const favicon = '/favicon.ico';

		// The page declares no icon: probe the conventional favicon location
		// with a HEAD request and use it only when the server answers 200.
		const foundFavicon = await new Promise<boolean>(done => {
			request.head(URL.resolve(url.href, favicon), (err, headRes) => {
				done(!err && headRes.statusCode === 200);
			});
		});

		if (foundFavicon) {
			icon = favicon;
		}
	}

	icon = icon ? URL.resolve(url.href, icon) : null;

	// Turn titles such as "Article - Site" into "Article": drop a trailing
	// site name, and if what remains ends with a separator, drop that too.
	// The suffix pattern is only built when a site name exists, so a missing
	// site name is never coerced into a pattern.
	const siteNameSuffix = siteName != null
		? new RegExp(`${escapeRegExp(siteName)}$`)
		: null;
	const withoutSiteName = (siteNameSuffix ? title.replace(siteNameSuffix, '') : title).trim();
	const trailingSeparator = /[\-—\|:]$/;

	if (trailingSeparator.test(withoutSiteName)) {
		title = withoutSiteName.replace(trailingSeparator, '').trim();
	}

	// Nothing left after stripping: fall back to the site name.
	if (title === '') {
		title = siteName;
	}

	return {
		title: title || null,
		icon: icon || null,
		description: description || null,
		thumbnail: image || null,
		sitename: siteName || null
	};
};
|