Sharkey/packages/backend/src/core/DownloadService.ts

157 lines
4.2 KiB
TypeScript
Raw Normal View History

/*
2024-02-12 04:37:45 +02:00
* SPDX-FileCopyrightText: syuilo and misskey-project
* SPDX-License-Identifier: AGPL-3.0-only
*/
2022-09-17 21:27:08 +03:00
import * as fs from 'node:fs';
2023-07-27 03:04:19 +03:00
import * as stream from 'node:stream/promises';
2022-09-17 21:27:08 +03:00
import { Inject, Injectable } from '@nestjs/common';
import ipaddr from 'ipaddr.js';
2022-09-17 21:27:08 +03:00
import chalk from 'chalk';
import got, * as Got from 'got';
import { parse } from 'content-disposition';
2022-09-17 21:27:08 +03:00
import { DI } from '@/di-symbols.js';
2022-09-20 23:33:11 +03:00
import type { Config } from '@/config.js';
import { HttpRequestService } from '@/core/HttpRequestService.js';
2022-09-17 21:27:08 +03:00
import { createTemp } from '@/misc/create-temp.js';
import { StatusError } from '@/misc/status-error.js';
2022-09-18 17:07:41 +03:00
import { LoggerService } from '@/core/LoggerService.js';
import type Logger from '@/logger.js';
2022-09-17 21:27:08 +03:00
import { bindThis } from '@/decorators.js';
2022-09-17 21:27:08 +03:00
@Injectable()
export class DownloadService {
2022-09-18 21:11:50 +03:00
private logger: Logger;
2022-09-17 21:27:08 +03:00
constructor(
@Inject(DI.config)
private config: Config,
private httpRequestService: HttpRequestService,
2022-09-18 17:07:41 +03:00
private loggerService: LoggerService,
2022-09-17 21:27:08 +03:00
) {
2022-09-18 21:11:50 +03:00
this.logger = this.loggerService.getLogger('download');
2022-09-17 21:27:08 +03:00
}
@bindThis
public async downloadUrl(url: string, path: string): Promise<{
filename: string;
}> {
this.logger.info(`Downloading ${chalk.cyan(url)} to ${chalk.cyanBright(path)} ...`);
2022-09-17 21:27:08 +03:00
const timeout = 30 * 1000;
const operationTimeout = 60 * 1000;
const maxSize = this.config.maxFileSize ?? 262144000;
const urlObj = new URL(url);
let filename = urlObj.pathname.split('/').pop() ?? 'untitled';
const req = got.stream(url, {
headers: {
'User-Agent': this.config.userAgent,
},
timeout: {
lookup: timeout,
connect: timeout,
secureConnect: timeout,
socket: timeout, // read timeout
response: timeout,
send: timeout,
request: operationTimeout, // whole operation timeout
},
agent: {
http: this.httpRequestService.httpAgent,
https: this.httpRequestService.httpsAgent,
},
http2: false, // default
retry: {
limit: 0,
},
enableUnixSockets: false,
}).on('response', (res: Got.Response) => {
if ((process.env.NODE_ENV === 'production' || process.env.NODE_ENV === 'test') && !this.config.proxy && res.ip) {
if (this.isPrivateIp(res.ip)) {
this.logger.warn(`Blocked address: ${res.ip}`);
req.destroy();
}
}
const contentLength = res.headers['content-length'];
if (contentLength != null) {
const size = Number(contentLength);
if (size > maxSize) {
this.logger.warn(`maxSize exceeded (${size} > ${maxSize}) on response`);
req.destroy();
}
}
const contentDisposition = res.headers['content-disposition'];
if (contentDisposition != null) {
try {
const parsed = parse(contentDisposition);
if (parsed.parameters.filename) {
filename = parsed.parameters.filename;
}
} catch (e) {
this.logger.warn(`Failed to parse content-disposition: ${contentDisposition}`, { stack: e });
}
}
}).on('downloadProgress', (progress: Got.Progress) => {
if (progress.transferred > maxSize) {
this.logger.warn(`maxSize exceeded (${progress.transferred} > ${maxSize}) on downloadProgress`);
req.destroy();
}
});
try {
2023-07-27 03:04:19 +03:00
await stream.pipeline(req, fs.createWriteStream(path));
} catch (e) {
if (e instanceof Got.HTTPError) {
throw new StatusError(`${e.response.statusCode} ${e.response.statusMessage}`, e.response.statusCode, e.response.statusMessage);
} else {
throw e;
}
}
2022-09-18 21:11:50 +03:00
this.logger.succ(`Download finished: ${chalk.cyan(url)}`);
return {
filename,
};
2022-09-17 21:27:08 +03:00
}
@bindThis
2022-09-17 21:27:08 +03:00
public async downloadTextFile(url: string): Promise<string> {
// Create temp file
const [path, cleanup] = await createTemp();
2022-09-18 21:11:50 +03:00
this.logger.info(`text file: Temp file is ${path}`);
2022-09-17 21:27:08 +03:00
try {
// write content at URL to temp file
await this.downloadUrl(url, path);
2023-07-27 03:04:19 +03:00
const text = await fs.promises.readFile(path, 'utf8');
2022-09-17 21:27:08 +03:00
return text;
} finally {
cleanup();
}
}
@bindThis
2022-09-18 21:11:50 +03:00
private isPrivateIp(ip: string): boolean {
const parsedIp = ipaddr.parse(ip);
2022-09-17 21:27:08 +03:00
for (const net of this.config.allowedPrivateNetworks ?? []) {
const cidr = ipaddr.parseCIDR(net);
if (cidr[0].kind() === parsedIp.kind() && parsedIp.match(ipaddr.parseCIDR(net))) {
2022-09-17 21:27:08 +03:00
return false;
}
}
return parsedIp.range() !== 'unicast';
2022-09-17 21:27:08 +03:00
}
}