2023-07-27 14:31:52 +09:00
|
|
|
/*
|
2024-02-14 00:59:27 +09:00
|
|
|
* SPDX-FileCopyrightText: syuilo and misskey-project
|
2023-07-27 14:31:52 +09:00
|
|
|
* SPDX-License-Identifier: AGPL-3.0-only
|
|
|
|
*/
|
|
|
|
|
2022-09-18 03:27:08 +09:00
|
|
|
import * as fs from 'node:fs';
|
2023-07-27 09:04:19 +09:00
|
|
|
import * as stream from 'node:stream/promises';
|
2022-09-18 03:27:08 +09:00
|
|
|
import { Inject, Injectable } from '@nestjs/common';
|
2023-06-25 06:35:09 +09:00
|
|
|
import ipaddr from 'ipaddr.js';
|
2022-09-18 03:27:08 +09:00
|
|
|
import chalk from 'chalk';
|
2023-01-25 12:00:04 +09:00
|
|
|
import got, * as Got from 'got';
|
2023-03-04 16:51:07 +09:00
|
|
|
import { parse } from 'content-disposition';
|
2022-09-18 03:27:08 +09:00
|
|
|
import { DI } from '@/di-symbols.js';
|
2022-09-21 05:33:11 +09:00
|
|
|
import type { Config } from '@/config.js';
|
2023-01-25 12:00:04 +09:00
|
|
|
import { HttpRequestService } from '@/core/HttpRequestService.js';
|
2022-09-18 03:27:08 +09:00
|
|
|
import { createTemp } from '@/misc/create-temp.js';
|
|
|
|
import { StatusError } from '@/misc/status-error.js';
|
2022-09-18 23:07:41 +09:00
|
|
|
import { LoggerService } from '@/core/LoggerService.js';
|
|
|
|
import type Logger from '@/logger.js';
|
2022-09-18 03:27:08 +09:00
|
|
|
|
2022-12-04 15:03:09 +09:00
|
|
|
import { bindThis } from '@/decorators.js';
|
2022-09-18 03:27:08 +09:00
|
|
|
|
|
|
|
/**
 * Service that downloads remote resources over HTTP(S) into local files.
 *
 * Requests go through the agents supplied by {@link HttpRequestService} and
 * are bounded by per-phase timeouts and a maximum body size.
 */
@Injectable()
export class DownloadService {
	private logger: Logger;

	constructor(
		@Inject(DI.config)
		private config: Config,

		private httpRequestService: HttpRequestService,
		private loggerService: LoggerService,
	) {
		this.logger = this.loggerService.getLogger('download');
	}

	/**
	 * Streams the content at `url` into the file at `path`.
	 *
	 * The request is destroyed (which makes the download fail) when:
	 * - the responding address is considered private by {@link isPrivateIp}
	 *   (only checked when NODE_ENV is `production` or `test`, no proxy is
	 *   configured, and the response exposes an IP), or
	 * - the announced `content-length` or the number of transferred bytes
	 *   exceeds `config.maxFileSize` (262144000 when unset).
	 *
	 * @param url - Absolute URL to download; it is parsed with `new URL`.
	 * @param path - Destination file path passed to `fs.createWriteStream`.
	 * @returns The suggested file name: the `filename` parameter of the
	 *   `content-disposition` header when present and parsable, otherwise the
	 *   last segment of the URL path, otherwise `'untitled'`.
	 * @throws StatusError when got reports an HTTP error response.
	 *   Any other error raised while streaming is rethrown unchanged.
	 */
	@bindThis
	public async downloadUrl(url: string, path: string): Promise<{
		filename: string;
	}> {
		this.logger.info(`Downloading ${chalk.cyan(url)} to ${chalk.cyanBright(path)} ...`);

		const timeout = 30 * 1000;
		const operationTimeout = 60 * 1000;
		const maxSize = this.config.maxFileSize ?? 262144000;

		const urlObj = new URL(url);
		// `split` always yields at least one element, so `pop()` is never
		// undefined here; an empty last segment (path ending in '/') must be
		// checked explicitly for the 'untitled' fallback to take effect.
		const lastSegment = urlObj.pathname.split('/').pop();
		let filename = lastSegment != null && lastSegment !== '' ? lastSegment : 'untitled';

		const req = got.stream(url, {
			headers: {
				'User-Agent': this.config.userAgent,
			},
			timeout: {
				lookup: timeout,
				connect: timeout,
				secureConnect: timeout,
				socket: timeout, // read timeout
				response: timeout,
				send: timeout,
				request: operationTimeout, // whole operation timeout
			},
			agent: {
				http: this.httpRequestService.httpAgent,
				https: this.httpRequestService.httpsAgent,
			},
			http2: false, // default
			retry: {
				limit: 0,
			},
			enableUnixSockets: false,
		}).on('response', (res: Got.Response) => {
			if ((process.env.NODE_ENV === 'production' || process.env.NODE_ENV === 'test') && !this.config.proxy && res.ip) {
				if (this.isPrivateIp(res.ip)) {
					this.logger.warn(`Blocked address: ${res.ip}`);
					req.destroy();
					// The request is already aborted; skip the remaining header checks.
					return;
				}
			}

			const contentLength = res.headers['content-length'];
			if (contentLength != null) {
				const size = Number(contentLength);
				if (size > maxSize) {
					this.logger.warn(`maxSize exceeded (${size} > ${maxSize}) on response`);
					req.destroy();
					return;
				}
			}

			const contentDisposition = res.headers['content-disposition'];
			if (contentDisposition != null) {
				try {
					const parsed = parse(contentDisposition);
					if (parsed.parameters.filename) {
						filename = parsed.parameters.filename;
					}
				} catch (e) {
					// A malformed header is not fatal: keep the URL-derived name.
					this.logger.warn(`Failed to parse content-disposition: ${contentDisposition}`, { stack: e });
				}
			}
		}).on('downloadProgress', (progress: Got.Progress) => {
			// Guards against bodies larger than announced (or with no content-length).
			if (progress.transferred > maxSize) {
				this.logger.warn(`maxSize exceeded (${progress.transferred} > ${maxSize}) on downloadProgress`);
				req.destroy();
			}
		});

		try {
			await stream.pipeline(req, fs.createWriteStream(path));
		} catch (e) {
			if (e instanceof Got.HTTPError) {
				throw new StatusError(`${e.response.statusCode} ${e.response.statusMessage}`, e.response.statusCode, e.response.statusMessage);
			} else {
				throw e;
			}
		}

		this.logger.succ(`Download finished: ${chalk.cyan(url)}`);

		return {
			filename,
		};
	}

	/**
	 * Downloads the content at `url` into a temporary file and returns it
	 * decoded as UTF-8 text. The temporary file's cleanup callback is always
	 * invoked, whether the download succeeds or fails.
	 *
	 * @param url - URL of the text resource.
	 * @returns The downloaded content as a string.
	 */
	@bindThis
	public async downloadTextFile(url: string): Promise<string> {
		// Create temp file
		const [path, cleanup] = await createTemp();

		this.logger.info(`text file: Temp file is ${path}`);

		try {
			// write content at URL to temp file
			await this.downloadUrl(url, path);

			const text = await fs.promises.readFile(path, 'utf8');

			return text;
		} finally {
			cleanup();
		}
	}

	/**
	 * Decides whether `ip` must be treated as a non-public address.
	 *
	 * @param ip - Textual IP address, parsed with `ipaddr.parse`.
	 * @returns `false` when the address lies inside one of
	 *   `config.allowedPrivateNetworks`; otherwise `true` exactly when
	 *   ipaddr.js classifies its range as anything other than `'unicast'`.
	 */
	@bindThis
	private isPrivateIp(ip: string): boolean {
		const parsedIp = ipaddr.parse(ip);

		for (const net of this.config.allowedPrivateNetworks ?? []) {
			const cidr = ipaddr.parseCIDR(net);
			// Only compare addresses of the same family (ipv4 vs ipv6).
			if (cidr[0].kind() === parsedIp.kind() && parsedIp.match(cidr)) {
				return false;
			}
		}

		return parsedIp.range() !== 'unicast';
	}
}
|