2023-07-16 05:02:00 +02:00
|
|
|
import * as fs from "node:fs";
|
|
|
|
import Logger from "@/services/logger.js";
|
|
|
|
import { createTemp, createTempDir } from "./create-temp.js";
|
|
|
|
import { downloadUrl } from "./download-url.js";
|
|
|
|
import { addFile } from "@/services/drive/add-file.js";
|
|
|
|
import { Users } from "@/models/index.js";
|
2023-07-16 07:47:06 +02:00
|
|
|
import * as tar from "tar-stream";
|
2023-07-16 07:41:57 +02:00
|
|
|
import gunzip from "gunzip-maybe";
|
2023-07-16 05:02:00 +02:00
|
|
|
|
2023-07-16 07:41:57 +02:00
|
|
|
// Module-level logger; every message emitted from this file is tagged "process-masto-notes".
const logger = new Logger("process-masto-notes");
|
2023-07-16 05:02:00 +02:00
|
|
|
|
|
|
|
/**
 * Downloads the archive at `url` into a temporary file, hands it to
 * `processMastoFile` together with a temporary extraction directory, and
 * returns whatever that call resolves to.
 *
 * Both temporary resources are released when the function settles, whether
 * it succeeds or fails.
 *
 * @param url - Location of the archive to download.
 * @param uid - User id forwarded to `processMastoFile`.
 * @returns The value resolved by `processMastoFile`.
 * @throws Propagates any error from temp creation, download or processing.
 */
export async function processMastoNotes(
  url: string,
  uid: string,
): Promise<any> {
  // Create temp file
  const [path, cleanup] = await createTemp();

  try {
    // Acquired inside the outer try so that a failure here still removes
    // the temp file created above.
    const [unzipPath, unzipCleanup] = await createTempDir();

    try {
      logger.info(`Temp file is ${path}`);

      // write content at URL to temp file
      await downloadUrl(url, path);
      return await processMastoFile(path, unzipPath, uid);
    } finally {
      unzipCleanup();
    }
  } finally {
    // Runs even if unzipCleanup() threw, so neither resource is leaked.
    cleanup();
  }
}
|
|
|
|
|
|
|
|
/**
 * Extracts the archive `fn` into `dir`, parses `outbox.json` from the
 * extracted tree and tries to add every attachment referenced by the outbox
 * items to the drive of the user identified by `uid`.
 *
 * Each attachment that was added successfully gets a `driveFile` property.
 * A failure on a single attachment is logged and skipped; it does not abort
 * the run.
 *
 * @param fn - Path of the downloaded archive.
 * @param dir - Directory the archive is extracted into.
 * @param uid - Id used to look up the owning user.
 * @returns The parsed outbox object, with attachments annotated in place.
 * @throws Rejects when the user lookup, extraction, or outbox parsing fails.
 */
async function processMastoFile(
  fn: string,
  dir: string,
  uid: string,
): Promise<unknown> {
  // Awaited in a plain async function: a failing lookup now rejects the
  // returned promise instead of leaving it pending forever.
  const user = await Users.findOneBy({ id: uid });

  try {
    logger.info(`Start unzip ${fn}`);
    await unzipTarGz(fn, dir);
    logger.info(`Unzip to ${dir}`);

    // Read as text explicitly; JSON.parse expects a string, not a Buffer.
    const outbox = JSON.parse(fs.readFileSync(`${dir}/outbox.json`, "utf-8"));

    for (const note of outbox.orderedItems) {
      // Items whose object carries no attachment array are left untouched
      // rather than aborting the whole import.
      const attachments = note?.object?.attachment;
      if (!Array.isArray(attachments)) continue;

      for (const attachment of attachments) {
        const url = attachment.url.replace("..", "");
        try {
          // Only the first ".." is stripped above; refuse anything that
          // could still climb out of the extraction directory.
          if (url.split(/[\\/]/).includes("..")) {
            throw new Error(`attachment path escapes archive: ${url}`);
          }
          const fpath = `${dir}${url}`;
          const driveFile = await addFile({ user: user, path: fpath });
          attachment.driveFile = driveFile;
        } catch (e) {
          logger.error(`Skipped adding file to drive: ${url}`);
        }
      }
    }

    return outbox;
  } catch (e) {
    logger.error(`Error on extract masto note package: ${fn}`);
    throw e;
  }
}
|
2023-07-16 07:41:57 +02:00
|
|
|
|
2023-07-16 07:47:06 +02:00
|
|
|
/**
 * Makes sure the parent directories of `fn` exist without leaving anything
 * at `fn` itself.
 *
 * When `fn` already exists nothing happens. Otherwise the full path is
 * created as a directory tree and the leaf directory is removed again, so
 * only the ancestors remain.
 *
 * @param fn - Path whose ancestor directories should exist.
 */
function createFileDir(fn: string) {
  const alreadyPresent = fs.existsSync(fn);
  if (alreadyPresent) {
    return;
  }

  // Create every path component, then drop the leaf so a file can be
  // written at that location afterwards.
  fs.mkdirSync(fn, { recursive: true });
  fs.rmdirSync(fn);
}
|
|
|
|
|
2023-07-16 07:47:06 +02:00
|
|
|
/**
 * Streams the archive `fn` through `gunzip()` and `tar.extract()` and writes
 * every entry beneath `dir`.
 *
 * @param fn - Path of the archive to read.
 * @param dir - Destination directory; a trailing "/" is added when missing.
 * @returns Resolves with the destination paths of all entries once the
 *   extractor has finished, which happens only after every file has been
 *   flushed to disk.
 * @throws Rejects with the underlying error when any stream fails, when a
 *   destination cannot be prepared, or when an entry name contains a ".."
 *   path segment.
 */
function unzipTarGz(fn: string, dir: string) {
  return new Promise<string[]>((resolve, reject) => {
    // Shared stream error handler; forwards the error so callers can see
    // what actually went wrong.
    const onErr = (err: unknown) => {
      logger.error(`pipe broken: ${err}`);
      reject(err);
    };

    try {
      const extract = tar.extract().on("error", onErr);
      const root = dir.endsWith("/") ? dir : dir + "/";
      const ls: string[] = [];

      extract.on("entry", function (header: any, stream: any, next: any) {
        try {
          // The archive is untrusted input: never write outside `root`.
          if (String(header.name).split(/[\\/]/).includes("..")) {
            throw new Error(`unsafe entry path: ${header.name}`);
          }

          const target = root + header.name;
          ls.push(target);

          if (header.type === "directory") {
            // Directory entries have no content to write; create the
            // directory and drain the (empty) entry stream.
            fs.mkdirSync(target, { recursive: true });
            stream.on("error", onErr).on("end", next).resume();
            return;
          }

          createFileDir(target);
          stream
            .on("error", onErr)
            .pipe(fs.createWriteStream(target))
            .on("error", onErr)
            // Advance only after the file is flushed, so that the
            // extractor's "finish" implies every file is complete.
            .on("finish", next);
        } catch (e) {
          logger.error(`create dir error:${e}`);
          reject(e);
        }
      });

      extract.on("finish", function () {
        resolve(ls);
      });

      fs.createReadStream(fn)
        .on("error", onErr)
        .pipe(gunzip())
        .on("error", onErr)
        .pipe(extract)
        .on("error", onErr);
    } catch (e) {
      logger.error(`unzipTarGz error: ${e}`);
      reject(e);
    }
  });
}
|