2018-11-21 05:11:00 +09:00
|
|
|
|
import * as P from 'parsimmon';
|
2019-03-14 21:23:15 +09:00
|
|
|
|
import { createLeaf, createTree, urlRegex } from './prelude';
|
2019-01-31 12:06:13 +09:00
|
|
|
|
import { takeWhile, cumulativeSum } from '../prelude/array';
|
2018-11-21 05:11:00 +09:00
|
|
|
|
import parseAcct from '../misc/acct/parse';
|
|
|
|
|
import { toUnicode } from 'punycode';
|
2019-03-18 00:03:57 +09:00
|
|
|
|
import { emojiRegex } from '../misc/emoji-regex';
|
2018-11-21 05:11:00 +09:00
|
|
|
|
|
2018-12-22 00:41:54 +09:00
|
|
|
|
/**
 * Truncates `s` at the first point where its brackets stop being balanced.
 *
 * Every opening bracket (`(`, `「`, `[`) counts +1 and every closing bracket
 * (`)`, `」`, `]`) counts -1; bracket kinds are not distinguished, so `(]`
 * is treated as a balanced pair.
 *
 * - If a closing bracket appears with no opener before it, everything from
 *   that bracket onwards is dropped.
 * - Otherwise the string is cut right after the last position at which the
 *   running depth is zero, which drops any unclosed opening bracket together
 *   with everything that follows it.
 *
 * @param s Text to clean up.
 * @returns The longest usable prefix of `s`; may be the empty string
 *          (for example when `s` starts with an unclosed opening bracket).
 */
export function removeOrphanedBrackets(s: string): string {
	const openBrackets = ['(', '「', '['];
	const closeBrackets = [')', '」', ']'];

	// depths[k] is the bracket nesting depth after reading s[k].
	const depths = cumulativeSum(s.split('').map(c => {
		if (openBrackets.includes(c)) return 1;
		if (closeBrackets.includes(c)) return -1;
		return 0;
	}));

	// A negative depth means a closing bracket without a matching opener.
	const firstOrphanedCloseBracket = depths.findIndex(depth => depth < 0);
	if (firstOrphanedCloseBracket !== -1) return s.slice(0, firstOrphanedCloseBracket);

	// lastIndexOf yields -1 when the depth never returns to zero, which makes
	// the slice below empty.
	const lastBalanced = depths.lastIndexOf(0);
	return s.slice(0, lastBalanced + 1);
}
|
|
|
|
|
|
2019-01-30 16:56:27 +09:00
|
|
|
|
/**
 * Parsimmon grammar for the markup handled by this module.
 *
 * Each property is a rule; `r` gives access to the sibling rules. Rules that
 * wrap nested markup re-parse their captured inner text with
 * `r.inline.atLeast(1).tryParse(...)` (or `r.root` for quotes) and store the
 * result as the children of the node built by `createTree`. Rules without
 * children build their node with `createLeaf`.
 */
export const mfmLanguage = P.createLanguage({
	// Whole document: one or more block or inline nodes.
	root: r => P.alt(r.block, r.inline).atLeast(1),

	// Restricted variant in which only emoji and plain text are recognised.
	plain: r => P.alt(r.emoji, r.text).atLeast(1),

	// Block-level rules, tried in this order.
	block: r => P.alt(
		r.quote,
		r.search,
		r.blockCode,
		r.mathBlock,
		r.center,
	),

	// Zero-width assertion: succeeds without consuming input at index 0, when
	// the current character is a line break, or when the previous one is.
	startOfLine: () => P((input, i) => {
		if (i === 0 || input[i] === '\n' || input[i - 1] === '\n') {
			return P.makeSuccess(i, null);
		} else {
			return P.makeFailure(i, 'not newline');
		}
	}),

	// Consecutive lines starting with '>'. The leading '>' and one following
	// space are stripped from every line and the remainder is parsed as a
	// nested document.
	quote: r => r.startOfLine.then(P((input, i) => {
		const text = input.slice(i);
		if (!/^>[\s\S]+?/.test(text)) return P.makeFailure(i, 'not a quote');
		const quote = takeWhile(line => line.startsWith('>'), text.split('\n'));
		const quoted = quote.join('\n');
		const qInner = quoted.replace(/^>/gm, '').replace(/^ /gm, '');
		if (qInner === '') return P.makeFailure(i, 'not a quote');
		const contents = r.root.tryParse(qInner);
		// "+ 1" also steps over the character right after the quoted lines
		// (the line break, when the quote is not at the end of the input).
		return P.makeSuccess(i + quoted.length + 1, createTree('quote', contents, {}));
	})),

	// "<query> Search" / "<query> [Search]" (also 検索) occupying a whole line.
	search: r => r.startOfLine.then(P((input, i) => {
		const text = input.slice(i);
		// The separator is an ASCII space or U+3000 (ideographic space),
		// written as an escape so the two alternatives stay distinguishable.
		// NOTE(review): the original showed two visually identical alternatives;
		// confirm that the second one was meant to be U+3000.
		const match = text.match(/^(.+?)( |\u3000)(検索|\[検索\]|Search|\[Search\])(\n|$)/i);
		if (!match) return P.makeFailure(i, 'not a search');
		return P.makeSuccess(i + match[0].length, createLeaf('search', { query: match[1], content: match[0].trim() }));
	})),

	// Fenced code block: ```lang? NEWLINE code NEWLINE ```
	blockCode: r => r.startOfLine.then(P((input, i) => {
		const text = input.slice(i);
		const match = text.match(/^```(.+?)?\n([\s\S]+?)\n```(\n|$)/i);
		if (!match) return P.makeFailure(i, 'not a blockCode');
		return P.makeSuccess(i + match[0].length, createLeaf('blockCode', { code: match[2], lang: match[1] ? match[1].trim() : null }));
	})),

	// Inline-level rules, tried in this order; `text` is the single-character
	// fallback and therefore comes last.
	inline: r => P.alt(
		r.big,
		r.bold,
		r.small,
		r.italic,
		r.strike,
		r.inlineCode,
		r.mathInline,
		r.mention,
		r.hashtag,
		r.url,
		r.link,
		r.emoji,
		r.fn,
		r.text
	),

	// TODO: remove this eventually.
	// ***text*** is turned into an `fn` node named 'tada' with no arguments.
	big: r => P.regexp(/^\*\*\*([\s\S]+?)\*\*\*/, 1).map(x => createTree('fn', r.inline.atLeast(1).tryParse(x), {
		name: 'tada',
		args: {}
	})),

	// **text**, or __text__ where the text is limited to ASCII letters,
	// digits and whitespace.
	bold: r => {
		const asterisk = P.regexp(/\*\*([\s\S]+?)\*\*/, 1);
		const underscore = P.regexp(/__([a-zA-Z0-9\s]+?)__/, 1);
		return P.alt(asterisk, underscore).map(x => createTree('bold', r.inline.atLeast(1).tryParse(x), {}));
	},

	// <small>text</small>
	small: r => P.regexp(/<small>([\s\S]+?)<\/small>/, 1).map(x => createTree('small', r.inline.atLeast(1).tryParse(x), {})),

	// <i>text</i>, or *text* / _text_ where the text starts with an ASCII
	// letter or digit.
	italic: r => {
		const xml = P.regexp(/<i>([\s\S]+?)<\/i>/, 1);
		const underscore = P((input, i) => {
			const text = input.slice(i);
			const match = text.match(/^(\*|_)([a-zA-Z0-9]+?[\s\S]*?)\1/);
			if (!match) return P.makeFailure(i, 'not a italic');
			// The marker must open the input or follow a space or a line break.
			const prev = input[i - 1];
			if (prev != null && prev !== ' ' && prev !== '\n') return P.makeFailure(i, 'not a italic');
			return P.makeSuccess(i + match[0].length, match[2]);
		});

		return P.alt(xml, underscore).map(x => createTree('italic', r.inline.atLeast(1).tryParse(x), {}));
	},

	// ~~text~~ on a single line, with no '~' inside.
	strike: r => P.regexp(/~~([^\n~]+?)~~/, 1).map(x => createTree('strike', r.inline.atLeast(1).tryParse(x), {})),

	// <center>text</center>, accepted only where `startOfLine` succeeds.
	center: r => r.startOfLine.then(P.regexp(/<center>([\s\S]+?)<\/center>/, 1).map(x => createTree('center', r.inline.atLeast(1).tryParse(x), {}))),

	// `code` on a single line.
	// NOTE(review): the excluded character is U+00B4 (acute accent), not a
	// backtick — presumably deliberate; confirm before changing.
	inlineCode: () => P.regexp(/`([^´\n]+?)`/, 1).map(x => createLeaf('inlineCode', { code: x })),

	// \[ formula \] accepted only where `startOfLine` succeeds; the formula is
	// trimmed.
	mathBlock: r => r.startOfLine.then(P.regexp(/\\\[([\s\S]+?)\\\]/, 1).map(x => createLeaf('mathBlock', { formula: x.trim() }))),

	// \( formula \) on a single line.
	mathInline: () => P.regexp(/\\\((.+?)\\\)/, 1).map(x => createLeaf('mathInline', { formula: x })),

	// @username or @username@host.
	mention: () => {
		return P((input, i) => {
			const text = input.slice(i);
			const match = text.match(/^@\w([\w-]*\w)?(?:@[\w.\-]+\w)?/);
			if (!match) return P.makeFailure(i, 'not a mention');
			// Rejected when glued to a preceding ASCII letter or digit.
			if (input[i - 1] != null && input[i - 1].match(/[a-z0-9]/i)) return P.makeFailure(i, 'not a mention');
			return P.makeSuccess(i + match[0].length, match[0]);
		}).map(x => {
			const { username, host } = parseAcct(x.slice(1));
			// With a host, the canonical form carries the host passed through
			// punycode's `toUnicode`; otherwise it is the matched text itself.
			const canonical = host != null ? `@${username}@${toUnicode(host)}` : x;
			return createLeaf('mention', { canonical, username, host, acct: x });
		});
	},

	// #tag
	hashtag: () => P((input, i) => {
		const text = input.slice(i);
		const match = text.match(/^#([^\s.,!?'"#:\/\[\]【】]+)/i);
		if (!match) return P.makeFailure(i, 'not a hashtag');
		let hashtag = match[1];
		hashtag = removeOrphanedBrackets(hashtag);
		// Rejected when the tag starts with U+20E3 or U+FE0F.
		if (hashtag.match(/^(\u20e3|\ufe0f)/)) return P.makeFailure(i, 'not a hashtag');
		// Rejected when the tag consists of digits only.
		if (hashtag.match(/^[0-9]+$/)) return P.makeFailure(i, 'not a hashtag');
		// Rejected when glued to a preceding ASCII letter or digit.
		if (input[i - 1] != null && input[i - 1].match(/[a-z0-9]/i)) return P.makeFailure(i, 'not a hashtag');
		// Length limit of 128, counted in code points rather than UTF-16 units.
		if (Array.from(hashtag || '').length > 128) return P.makeFailure(i, 'not a hashtag');
		return P.makeSuccess(i + ('#' + hashtag).length, createLeaf('hashtag', { hashtag: hashtag }));
	}),

	// A bare URL matched by `urlRegex`, or a URL wrapped as <https://...>.
	url: () => {
		// Clean-up applied to every candidate: cut at unbalanced brackets, then
		// drop trailing '.' and ',' characters.
		const trim = (candidate: string): string =>
			removeOrphanedBrackets(candidate).replace(/[.,]*$/, '');

		return P((input, i) => {
			const text = input.slice(i);

			// Assumes `urlRegex` only matches at the start of `text` — the
			// index arithmetic relies on it; confirm in './prelude'.
			const bare = text.match(urlRegex);
			if (bare) {
				const url = trim(bare[0]);
				return P.makeSuccess(i + url.length, url);
			}

			const bracketed = text.match(/^<(https?:\/\/.*?)>/);
			if (!bracketed) {
				return P.makeFailure(i, 'not a url');
			}
			// Always consume the whole "<...>" span, even when `trim` shortened
			// the URL; otherwise the closing '>' (and possibly more) would be
			// left behind and re-parsed as text.
			return P.makeSuccess(i + bracketed[0].length, trim(bracketed[1]));
		}).map(x => createLeaf('url', { url: x }));
	},

	// [text](url); a leading '?' sets the `silent` prop to true.
	link: r => {
		return P.seqObj(
			['silent', P.string('?').fallback(null).map(x => x != null)] as any,
			P.string('['), ['text', P.regexp(/[^\n\[\]]+/)] as any, P.string(']'),
			P.string('('), ['url', r.url] as any, P.string(')'),
		).map((x: any) => {
			return createTree('link', r.inline.atLeast(1).tryParse(x.text), {
				silent: x.silent,
				url: x.url.node.props.url
			});
		});
	},

	// :name: custom emoji, or an emoji matched by `emojiRegex`.
	emoji: () => {
		const name = P.regexp(/:([a-z0-9_+-]+):/i, 1).map(x => createLeaf('emoji', { name: x }));
		const code = P.regexp(emojiRegex).map(x => createLeaf('emoji', { emoji: x }));
		return P.alt(name, code);
	},

	// [name text] or [name.arg1,arg2=value text]
	fn: r => {
		return P.seqObj(
			P.string('['), ['fn', P.regexp(/[^\s\n\[\]]+/)] as any, P.string(' '), P.optWhitespace, ['text', P.regexp(/[^\n\[\]]+/)] as any, P.string(']'),
		).map((x: any) => {
			let name = x.fn;
			// A bare argument maps to `true`, "key=value" maps to the value.
			const args: Record<string, string | true> = {};
			const separator = x.fn.indexOf('.');
			if (separator > -1) {
				// Everything before the first '.' is the function name, the
				// rest is a comma-separated argument list.
				name = x.fn.slice(0, separator);
				for (const arg of x.fn.slice(separator + 1).split(',')) {
					const kv = arg.split('=');
					args[kv[0]] = kv.length === 1 ? true : kv[1];
				}
			}
			return createTree('fn', r.inline.atLeast(1).tryParse(x.text), {
				name,
				args
			});
		});
	},

	// Fallback: any single character becomes a text node.
	text: () => P.any.map(x => createLeaf('text', { text: x }))
});
|