240 lines
7.4 KiB
JavaScript
240 lines
7.4 KiB
JavaScript
|
var https = require('follow-redirects').https;
|
|||
|
var fs = require('fs');
|
|||
|
const path = require('path');
|
|||
|
|
|||
|
const base64Utils = require('../utils/base64Utils')
|
|||
|
|
|||
|
const { token, userId } = require('./config')
|
|||
|
|
|||
|
const outputDir = './output/' // 以 / 结尾
|
|||
|
const courseDetailDir = 'courseDetail/' // 以 / 结尾
|
|||
|
const downloadMediaDir = 'downloadMedia/' // 以 / 结尾
|
|||
|
|
|||
|
main()
|
|||
|
|
|||
|
async function main() {
|
|||
|
// /**
|
|||
|
// * Step 1 课程列表
|
|||
|
// */
|
|||
|
await getCourseList(1594)
|
|||
|
|
|||
|
// /**
|
|||
|
// * Step 2 课程详情
|
|||
|
// */
|
|||
|
let courseListJson = fs.readFileSync(outputDir + 'courseList.json', 'utf8')
|
|||
|
let courseList = JSON.parse(courseListJson).data.childs
|
|||
|
await getCourseDetail(courseList)
|
|||
|
|
|||
|
/**
|
|||
|
* Step 3 解析数据
|
|||
|
*/
|
|||
|
await parseCourseDetailJson()
|
|||
|
|
|||
|
/**
|
|||
|
* Step 3 下载音频,保存课件
|
|||
|
*/
|
|||
|
await downloadMedia()
|
|||
|
|
|||
|
console.log('完成')
|
|||
|
}
|
|||
|
|
|||
|
async function getCourseList(courseId) {
|
|||
|
var options = {
|
|||
|
'method': 'POST',
|
|||
|
'hostname': 'wx.hxdkfp.com',
|
|||
|
'path': '/czw-api/api-hypt-product/hypt/product/getProductInfo?id=' + courseId + '&serviceType=3&userId=' + userId,
|
|||
|
'headers': {
|
|||
|
'token': token
|
|||
|
},
|
|||
|
// 'maxRedirects': 20,
|
|||
|
'rejectUnauthorized': false
|
|||
|
};
|
|||
|
await httpsRequest(options, outputDir + 'courseList.json')
|
|||
|
}
|
|||
|
|
|||
|
async function getCourseDetail(courseList) {
|
|||
|
// console.log(courseList)
|
|||
|
for (let i = 0; i < courseList.length; i++) {
|
|||
|
const courseDetail = courseList[i]
|
|||
|
/*
|
|||
|
{
|
|||
|
id: 2662,
|
|||
|
serviceType: '1',
|
|||
|
imgUrl: 'e41f693bbfe4442d8c611633644802fc.jpg',
|
|||
|
publishTime: '2023-09-11 00:00:00',
|
|||
|
serviceName: '【第559期】关于耕地占用税的那些事儿',
|
|||
|
serviceOrder: 1,
|
|||
|
serviceStatus: '0',
|
|||
|
isCard: '0',
|
|||
|
isFree: '1',
|
|||
|
realPrice: '5',
|
|||
|
labelNum: '1',
|
|||
|
labelName: '音频',
|
|||
|
verificationCodeFlag: false,
|
|||
|
serviceStatusName: '上架',
|
|||
|
downButtonFlag: true,
|
|||
|
agreementString: ''
|
|||
|
},
|
|||
|
*/
|
|||
|
const courseDetailId = courseDetail.id
|
|||
|
const courseDetailName = courseDetail.serviceName
|
|||
|
console.log(`${i}\t| ${courseDetailId} | ${courseDetailName}`)
|
|||
|
try {
|
|||
|
let options = {
|
|||
|
'method': 'POST',
|
|||
|
'hostname': 'wx.hxdkfp.com',
|
|||
|
'path': '/czw-api/api-hypt-product/hypt/product/getProductInfo?id=' + courseDetailId + '&serviceType=1&userId=' + userId,
|
|||
|
'headers': {
|
|||
|
'token': token
|
|||
|
},
|
|||
|
// 'maxRedirects': 20,
|
|||
|
'rejectUnauthorized': false
|
|||
|
};
|
|||
|
await httpsRequest(options, outputDir + courseDetailDir + courseDetailId + '.json')
|
|||
|
console.log('\t完成')
|
|||
|
|
|||
|
await waitAMinute()
|
|||
|
} catch (err) {
|
|||
|
console.error(err)
|
|||
|
}
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
async function parseCourseDetailJson() {
|
|||
|
const dirPath = outputDir + courseDetailDir
|
|||
|
var infoDir = [
|
|||
|
// {
|
|||
|
// name: '',
|
|||
|
// audioUrl: '',
|
|||
|
// publishTime: '',
|
|||
|
// brief: '',
|
|||
|
// detail: '',
|
|||
|
// }
|
|||
|
]
|
|||
|
// 读取目录下的所有文件名
|
|||
|
const files = fs.readdirSync(dirPath);
|
|||
|
for (let file of files) {
|
|||
|
// 拼接文件的完整路径
|
|||
|
const filePath = path.join(dirPath, file);
|
|||
|
// 读取文件的内容
|
|||
|
let fileContent = fs.readFileSync(filePath, 'utf8');
|
|||
|
const jsonObj = JSON.parse(fileContent);
|
|||
|
const data = jsonObj.data
|
|||
|
const brief = base64Utils.base64_decode(data.briefString)
|
|||
|
const detail = base64Utils.base64_decode(data.detailString)
|
|||
|
const filename = deleteFilenameUnsupportChar(data.serviceName)
|
|||
|
// 打印文件名和文件内容
|
|||
|
console.log(file);
|
|||
|
infoDir.push({
|
|||
|
name: filename,
|
|||
|
audioUrl: data.audioUrl,
|
|||
|
// publishTime: data.publishTime,
|
|||
|
// brief: brief,
|
|||
|
// detail: detail,
|
|||
|
})
|
|||
|
fs.writeFileSync(outputDir + downloadMediaDir + filename + '-简介.html', brief, 'utf8')
|
|||
|
fs.writeFileSync(outputDir + downloadMediaDir + filename + '-详情.html', detail, 'utf8')
|
|||
|
}
|
|||
|
fs.writeFileSync(outputDir + 'parsedCourseDetails.json', JSON.stringify(infoDir, null, 4), 'utf8')
|
|||
|
}
|
|||
|
|
|||
|
async function downloadMedia() {
|
|||
|
const parsedCourseDetails = JSON.parse(fs.readFileSync(outputDir + 'parsedCourseDetails.json', 'utf8'))
|
|||
|
for (let i = 0; i < parsedCourseDetails.length; i++) {
|
|||
|
const item = parsedCourseDetails[i]
|
|||
|
const audioUrl = item.audioUrl
|
|||
|
const filename = item.name
|
|||
|
const fileNameWithExt = audioUrl.lastIndexOf('.') != -1
|
|||
|
? filename + audioUrl.substring(audioUrl.lastIndexOf('.'))
|
|||
|
: filename
|
|||
|
console.log(`${i}\t| ${fileNameWithExt} | ${item.audioUrl}`)
|
|||
|
try {
|
|||
|
await downloadFile(audioUrl, outputDir + downloadMediaDir + fileNameWithExt)
|
|||
|
} catch (err) {
|
|||
|
console.error(err)
|
|||
|
}
|
|||
|
await waitAMinute()
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
// 公共请求方法
|
|||
|
async function httpsRequest(options, fileneme) {
|
|||
|
return await new Promise((resolve) => {
|
|||
|
|
|||
|
var req = https.request(options, function (res) {
|
|||
|
var chunks = [];
|
|||
|
|
|||
|
res.on("data", function (chunk) {
|
|||
|
chunks.push(chunk);
|
|||
|
});
|
|||
|
|
|||
|
res.on("end", function (chunk) {
|
|||
|
var body = Buffer.concat(chunks);
|
|||
|
var result = body.toString()
|
|||
|
// console.log(result);
|
|||
|
fs.writeFileSync(fileneme, result, 'utf8')
|
|||
|
resolve(result)
|
|||
|
});
|
|||
|
|
|||
|
res.on("error", function (error) {
|
|||
|
console.error(error);
|
|||
|
});
|
|||
|
});
|
|||
|
|
|||
|
req.end();
|
|||
|
})
|
|||
|
}
|
|||
|
|
|||
|
async function waitAMinute() {
|
|||
|
return await new Promise((resolve) => {
|
|||
|
setTimeout(resolve, 100)
|
|||
|
})
|
|||
|
}
|
|||
|
|
|||
|
function deleteFilenameUnsupportChar(name) {
|
|||
|
return name
|
|||
|
.replace(/\?/g, "?")
|
|||
|
.replace(/\:/g, ":")
|
|||
|
.replace(/\t/g, " ")
|
|||
|
.replace(/"/g, "''")
|
|||
|
}
|
|||
|
|
|||
|
/**
|
|||
|
*
|
|||
|
* @param {*} fileUrl 要下载的文件的 url
|
|||
|
* @param {*} downloadPath 要保存的文件的路径
|
|||
|
*/
|
|||
|
async function downloadFile(fileUrl, downloadPath) {
|
|||
|
return await new Promise((resolve, reject) => {
|
|||
|
// 创建一个可写的文件流
|
|||
|
const file = fs.createWriteStream(downloadPath);
|
|||
|
|
|||
|
// 发起 https 请求,获取响应流
|
|||
|
const request = https.request(fileUrl, response => {
|
|||
|
// 将响应流写入文件流
|
|||
|
response.pipe(file);
|
|||
|
// 监听文件流的 finish 事件,表示下载完成
|
|||
|
file.on("finish", () => {
|
|||
|
// 关闭文件流
|
|||
|
file.close();
|
|||
|
// 打印下载成功的消息
|
|||
|
console.log("\t文件下载完毕");
|
|||
|
resolve()
|
|||
|
});
|
|||
|
});
|
|||
|
|
|||
|
// 监听请求的 error 事件,表示下载失败
|
|||
|
request.on("error", err => {
|
|||
|
// 删除已下载的文件
|
|||
|
fs.unlink(downloadPath, () => {
|
|||
|
// 打印下载失败的消息
|
|||
|
console.error(`\t下载失败: ${err.message}`);
|
|||
|
reject()
|
|||
|
});
|
|||
|
});
|
|||
|
|
|||
|
// 结束请求
|
|||
|
request.end();
|
|||
|
})
|
|||
|
}
|