trending-in-one/weibo-search.ts

61 lines
1.7 KiB
TypeScript
Raw Normal View History

2020-11-29 03:11:35 +08:00
#!/usr/bin/env -S deno run --unstable --allow-net --allow-read --allow-write --import-map=import_map.json
// Copyright 2020 justjavac(迷渡). All rights reserved. MIT license.
import { format } from "std/datetime/mod.ts";
import { join } from "std/path/mod.ts";
import { exists } from "std/fs/mod.ts";
import type { Word } from "./types.ts";
2020-11-29 13:03:19 +08:00
import {
createArchive4Weibo,
createReadme4Weibo,
mergeWords4Weibo,
} from "./utils.ts";
2020-11-29 03:11:35 +08:00
const regexp = /<a href="(\/weibo\?q=[^"]+)".*?>(.+)<\/a>/g;
const response = await fetch("https://s.weibo.com/top/summary");
if (!response.ok) {
console.error(response.statusText);
Deno.exit(-1);
}
const result: string = await response.text();
const matches = result.matchAll(regexp);
const words: Word[] = Array.from(matches).map((x) => ({
url: x[1],
title: x[2],
}));
const yyyyMMdd = format(new Date(), "yyyy-MM-dd");
const fullPath = join("raw/weibo-search", `${yyyyMMdd}.json`);
let wordsAlreadyDownload: Word[] = [];
if (await exists(fullPath)) {
const content = await Deno.readTextFile(fullPath);
wordsAlreadyDownload = JSON.parse(content);
}
const queswordsAll = mergeWords4Weibo(words, wordsAlreadyDownload);
2020-11-29 13:03:19 +08:00
export const weiboSearchData = queswordsAll.map((x) => {
2020-11-29 03:11:35 +08:00
x.realurl = `https://s.weibo.com/${x.url}`;
return x;
});
export async function weiboSearch() {
// 保存原始数据
await Deno.writeTextFile(fullPath, JSON.stringify(queswordsAll));
// 更新 README.md
const readme = await createReadme4Weibo(queswordsAll);
await Deno.writeTextFile("./README.md", readme);
// 更新 archives
const archiveText = createArchive4Weibo(queswordsAll, yyyyMMdd);
const archivePath = join("archives/weibo-search", `${yyyyMMdd}.md`);
await Deno.writeTextFile(archivePath, archiveText);
}