??改为|| 兼容node v12.13.1
This commit is contained in:
@@ -6,23 +6,6 @@ const sleepUtils = require('../../../utils/sleepUtils');
|
||||
|
||||
const dbUtils = global.dbUtils;
|
||||
|
||||
/**
 * Load one song from the database together with its album and artist ids.
 *
 * @param {Object} params
 * @param {*} params.songId - Value bound to the `song_id` placeholder in all three queries.
 * @returns {Promise<Object>} `{}` when the `song` table has no matching row; otherwise a
 *   JSON-round-tripped copy of the first matching row with `albumIds` and `artistIds`
 *   arrays added.
 */
async function getFromDatabase({ songId }) {
    // Look up the song row itself first; with no row there is nothing to assemble.
    const songRows = await dbUtils.query('SELECT * FROM song WHERE song_id = ?', [songId]);
    if (songRows.length === 0) return {};

    // The album and artist relation lookups are independent of each other, so run them together.
    const [albumRelations, artistRelations] = await Promise.all([
        dbUtils.query('SELECT * FROM song_album_relation WHERE song_id = ?', [songId]),
        dbUtils.query('SELECT * FROM song_artist_relation WHERE song_id = ?', [songId]),
    ]);

    // Assemble the result on a JSON-round-tripped copy so the queried row object is not mutated.
    const songInfo = JSON.parse(JSON.stringify(songRows[0]));
    songInfo.albumIds = albumRelations.map((relation) => relation.album_id);
    songInfo.artistIds = artistRelations.map((relation) => relation.artist_id);
    return songInfo;
}
|
||||
|
||||
// 从数据库中查出还缺少的歌曲,并进行爬取
|
||||
async function fetchAll({ args = {} }) {
|
||||
console.log("start fetching songs ...");
|
||||
@@ -41,12 +24,18 @@ async function fetchAll({ args = {} }) {
|
||||
|
||||
var songIds = await dbUtils.query(sql, []);
|
||||
songIds = songIds.map(item => item.song_id);
|
||||
for (let i = 0; i < songIds.length; i++) {
|
||||
|
||||
// 0 - 100, 200 - 399, 400 - ..., ... - songIds.length-1
|
||||
// 0 1 2 count-1
|
||||
var step = 270;
|
||||
var total = songIds.length;
|
||||
var count = Math.ceil(total / step);
|
||||
for (let i = 0; i < count; i++) {
|
||||
await global.checkIsExit();
|
||||
const songId = songIds[i];
|
||||
console.log(`${i + 1}/${songIds.length} | song: ${songId} | ${args.min ?? "?"}-${args.max ?? "?"}`);
|
||||
var subArray = songIds.slice(i * step, (i + 1) * step);
|
||||
console.log(`${i + 1}/${count} | song: ${subArray[0]}-${subArray.slice(-1)[0]} | ${args.min || "?"}-${args.max || "?"}`);
|
||||
try {
|
||||
await fetch({ songId: songId });
|
||||
await fetch({ songIdArray: subArray });
|
||||
} catch (err) {
|
||||
console.error(err);
|
||||
}
|
||||
@@ -55,55 +44,26 @@ async function fetchAll({ args = {} }) {
|
||||
}
|
||||
|
||||
// 获取音乐详情
|
||||
async function fetch({ songId, debug = false }) {
|
||||
async function fetch({ songIdArray, debug = false }) {
|
||||
let result = await dbUtils.query('SELECT count(*) as count FROM song WHERE song_id = ?', [songId]);
|
||||
if (result[0].count > 0 && !debug) {
|
||||
console.log(`数据库中已有数据,跳过 songId: ${songId}`);
|
||||
return;
|
||||
}
|
||||
|
||||
let url = `https://music.163.com/song?id=${songId}`;
|
||||
// https://neteasecloudmusicapi-docs.4everland.app/#/?id=%e8%8e%b7%e5%8f%96%e6%ad%8c%e6%9b%b2%e8%af%a6%e6%83%85
|
||||
try {
|
||||
// var html = fs.readFileSync(path.join(__dirname, "../../temp", `song-${songId}.html`), 'utf8');
|
||||
var html = await requestUtils.getApiResult(url);
|
||||
// fs.writeFileSync(path.join(__dirname, "../../temp", `song-${songId}.html`), html);
|
||||
// 每一次大概可以取到270条以上
|
||||
var songResult = await song_detail({
|
||||
ids: ["64956", "64956"].join(','),
|
||||
});
|
||||
fs.writeFileSync(path.join(__dirname, "../../temp", `song-${playlistId}.json`), JSON.stringify(playlistResult));
|
||||
} catch (errors) {
|
||||
console.error(errors);
|
||||
return;
|
||||
}
|
||||
|
||||
if (html.includes(`<p class="note s-fc3">很抱歉,你要查找的网页找不到</p>`)) {
|
||||
let deleteResult1 = await dbUtils.query('DELETE FROM song_album_relation WHERE song_id = ?', [songId]);
|
||||
let deleteResult2 = await dbUtils.query('DELETE FROM song_artist_relation WHERE song_id = ?', [songId]);
|
||||
console.log(`song: ${songId} 不存在,从song_album_relation, song_artist_relation表中删除. affectedRows: ${deleteResult1.affectedRows}, ${deleteResult2.affectedRows}`);
|
||||
return;
|
||||
}
|
||||
|
||||
// 正则匹配
|
||||
let regExResult = /\<script type\=\"application\/ld\+json\"\>([\S\s]*?)\<\/script\>/.exec(html);
|
||||
let songInfoJSONString = regExResult[1];
|
||||
let songInfoDict = JSON.parse(songInfoJSONString);
|
||||
// console.log(songInfoDict);
|
||||
|
||||
// TODO 考虑歌曲别名 例如:https://music.163.com/#/song?id=26830207
|
||||
|
||||
let title = /<meta property="og:title" content="(.*?)" \/>/.exec(html)[1];
|
||||
let image = /<meta property="og:image" content="http:\/\/p.\.music\.126\.net\/(.*?)" \/>/.exec(html)[1];
|
||||
let artist = /<meta property="og:music:artist" content="(.*?)" \/>/.exec(html)[1];
|
||||
let duration = /<meta property="music:duration" content="(.*?)"\/>/.exec(html)[1];
|
||||
try {
|
||||
var album = /<meta property="og:music:album" content="(.*?)"\/>/.exec(html)[1];
|
||||
var albumId = /<meta property="music:album" content="https:\/\/music\.163\.com\/album\?id=(.*?)"\/>/.exec(html)[1];
|
||||
} catch (err) {
|
||||
// 歌曲不在专辑中
|
||||
}
|
||||
|
||||
const reg = /<meta property="music:musician" content="https:\/\/music\.163\.com\/artist\?id=(.*?)"\/>/g;
|
||||
let artistIds = [];
|
||||
let matched = null;
|
||||
while ((matched = reg.exec(html)) !== null) {
|
||||
artistIds.push(matched[1]);
|
||||
}
|
||||
console.log(playlistResult);
|
||||
|
||||
let songInfo = {
|
||||
songId: songId,
|
||||
@@ -138,7 +98,6 @@ async function fetch({ songId, debug = false }) {
|
||||
}
|
||||
|
||||
module.exports = {
|
||||
getFromDatabase: getFromDatabase,
|
||||
fetch: fetch,
|
||||
fetchAll: fetchAll,
|
||||
}
|
Reference in New Issue
Block a user