mirror of
https://github.com/musix-org/musix-oss
synced 2024-12-23 16:13:18 +00:00
172 lines
5.4 KiB
JavaScript
172 lines
5.4 KiB
JavaScript
const qs = require('querystring');
|
|
const url = require('url');
|
|
const Entities = require('html-entities').AllHtmlEntities;
|
|
const util = require('./util');
|
|
const parseTime = require('m3u8stream/dist/parse-time');
|
|
|
|
|
|
|
|
// Base watch-page URL. Links scraped from the page are resolved against it
// with `url.resolve` elsewhere in this module.
const VIDEO_URL = 'https://www.youtube.com/watch?v=';

/**
 * Read the `content` attribute of a `<meta itemprop="...">` tag.
 *
 * @param {string} body Page html to search.
 * @param {string} name Value of the `itemprop` attribute to look for.
 * @return {string} Whatever `util.between` yields for the text between the
 *   opening `<meta itemprop="name" content="` and the closing `">`.
 */
const getMetaItem = (body, name) => {
  const opening = `<meta itemprop="${name}" content="`;
  const closing = '">';
  return util.between(body, opening, closing);
};
|
|
|
|
|
|
/**
|
|
* Get video description from html
|
|
*
|
|
* @param {string} html
|
|
* @return {string}
|
|
*/
|
|
exports.getVideoDescription = (html) => {
|
|
const regex = /<p.*?id="eow-description".*?>(.+?)<\/p>[\n\r\s]*?<\/div>/im;
|
|
const description = html.match(regex);
|
|
return description ?
|
|
Entities.decode(util.stripHTML(description[1])) : '';
|
|
};
|
|
|
|
/**
|
|
* Get video media (extra information) from html
|
|
*
|
|
* @param {string} body
|
|
* @return {Object}
|
|
*/
|
|
exports.getVideoMedia = (body) => {
|
|
let mediainfo = util.between(body,
|
|
'<div id="watch-description-extras">',
|
|
'<div id="watch-discussion" class="branded-page-box yt-card">');
|
|
if (mediainfo === '') {
|
|
return {};
|
|
}
|
|
|
|
const regexp = /<h4 class="title">([\s\S]*?)<\/h4>[\s\S]*?<ul .*?class=".*?watch-info-tag-list">[\s\S]*?<li>([\s\S]*?)<\/li>(?:\s*?<li>([\s\S]*?)<\/li>)?/g;
|
|
const contentRegexp = /(?: - (\d{4}) \()?<a .*?(?:href="([^"]+)")?.*?>(.*?)<\/a>/;
|
|
const imgRegexp = /<img src="([^"]+)".*?>/;
|
|
const media = {};
|
|
|
|
const image = imgRegexp.exec(mediainfo);
|
|
if (image) {
|
|
media.image = url.resolve(VIDEO_URL, image[1]);
|
|
}
|
|
|
|
let match;
|
|
while ((match = regexp.exec(mediainfo)) != null) {
|
|
let [, key, value, detail] = match;
|
|
key = Entities.decode(key).trim().replace(/\s/g, '_').toLowerCase();
|
|
const content = contentRegexp.exec(value);
|
|
if (content) {
|
|
let [, year, mediaUrl, value2] = content;
|
|
if (year) {
|
|
media.year = parseInt(year);
|
|
} else if (detail) {
|
|
media.year = parseInt(detail);
|
|
}
|
|
value = value.slice(0, content.index);
|
|
if (key !== 'game' || value2 !== 'YouTube Gaming') {
|
|
value += value2;
|
|
}
|
|
media[key + '_url'] = url.resolve(VIDEO_URL, mediaUrl);
|
|
}
|
|
media[key] = Entities.decode(value);
|
|
}
|
|
return media;
|
|
};
|
|
|
|
/**
|
|
* Get video Owner from html.
|
|
*
|
|
* @param {string} body
|
|
* @return {Object}
|
|
*/
|
|
const userRegexp = /<a href="\/user\/([^"]+)/;
|
|
const verifiedRegexp = /<span .*?(aria-label="Verified")(.*?(?=<\/span>))/;
|
|
exports.getAuthor = (body) => {
|
|
let ownerinfo = util.between(body,
|
|
'<div id="watch7-user-header" class=" spf-link ">',
|
|
'<div id="watch8-action-buttons" class="watch-action-buttons clearfix">');
|
|
if (ownerinfo === '') {
|
|
return {};
|
|
}
|
|
const channelName = Entities.decode(util.between(util.between(
|
|
ownerinfo, '<div class="yt-user-info">', '</div>'), '>', '</a>'));
|
|
const userMatch = ownerinfo.match(userRegexp);
|
|
const verifiedMatch = ownerinfo.match(verifiedRegexp);
|
|
const channelID = getMetaItem(body, 'channelId');
|
|
const username = userMatch ? userMatch[1] : util.between(
|
|
util.between(body, '<span itemprop="author"', '</span>'), '/user/', '">');
|
|
return {
|
|
id: channelID,
|
|
name: channelName,
|
|
avatar: url.resolve(VIDEO_URL, util.between(ownerinfo,
|
|
'data-thumb="', '"')),
|
|
verified: !!verifiedMatch,
|
|
user: username,
|
|
channel_url: 'https://www.youtube.com/channel/' + channelID,
|
|
user_url: 'https://www.youtube.com/user/' + username,
|
|
};
|
|
};
|
|
|
|
|
|
/**
|
|
* Get video published at from html.
|
|
*
|
|
* @param {string} body
|
|
* @return {string}
|
|
*/
|
|
exports.getPublished = (body) => {
|
|
return Date.parse(getMetaItem(body, 'datePublished'));
|
|
};
|
|
|
|
|
|
/**
|
|
* Get video published at from html.
|
|
* Credits to https://github.com/paixaop.
|
|
*
|
|
* @param {string} body
|
|
* @return {Array.<Object>}
|
|
*/
|
|
exports.getRelatedVideos = (body) => {
|
|
let jsonStr = util.between(body, '\'RELATED_PLAYER_ARGS\': ', ',\n');
|
|
let watchNextJson, rvsParams, secondaryResults;
|
|
try {
|
|
jsonStr = JSON.parse(jsonStr);
|
|
watchNextJson = JSON.parse(jsonStr.watch_next_response);
|
|
rvsParams = jsonStr.rvs.split(',').map((e) => qs.parse(e));
|
|
secondaryResults = watchNextJson.contents.twoColumnWatchNextResults.secondaryResults.secondaryResults.results;
|
|
}
|
|
catch (err) {
|
|
return [];
|
|
}
|
|
let videos = [];
|
|
for (let result of secondaryResults) {
|
|
let details = result.compactVideoRenderer;
|
|
if (details) {
|
|
try {
|
|
let viewCount = details.viewCountText.simpleText;
|
|
let shortViewCount = details.shortViewCountText.simpleText;
|
|
let rvsDetails = rvsParams.find((elem) => elem.id === details.videoId);
|
|
if (!/^\d/.test(shortViewCount)) {
|
|
shortViewCount = rvsDetails && rvsDetails.short_view_count_text || '';
|
|
}
|
|
viewCount = (/^\d/.test(viewCount) ? viewCount : shortViewCount).split(' ')[0];
|
|
videos.push({
|
|
id: details.videoId,
|
|
title: details.title.simpleText,
|
|
author: details.shortBylineText.runs[0].text,
|
|
ucid: details.shortBylineText.runs[0].navigationEndpoint.browseEndpoint.browseId,
|
|
author_thumbnail: details.channelThumbnail.thumbnails[0].url,
|
|
short_view_count_text: shortViewCount.split(' ')[0],
|
|
view_count: viewCount.replace(',', ''),
|
|
length_seconds: details.lengthText ?
|
|
Math.floor(parseTime.humanStr(details.lengthText.simpleText) / 1000) :
|
|
rvsParams && rvsParams.length_seconds + '',
|
|
video_thumbnail: details.thumbnail.thumbnails[0].url,
|
|
});
|
|
} catch (err) {
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
return videos;
|
|
};
|