// This contains zulip's frontend markdown implementation; see // docs/subsystems/markdown.md for docs on our Markdown syntax. The other // main piece in rendering markdown client-side is // static/third/marked/lib/marked.js, which we have significantly // modified from the original implementation. var markdown = (function () { var exports = {}; var realm_filter_map = {}; var realm_filter_list = []; // Helper function function escape(html, encode) { return html .replace(!encode ? /&(?!#?\w+;)/g : /&/g, '&') .replace(//g, '>') .replace(/"/g, '"') .replace(/'/g, '''); } // Regexes that match some of our common bugdown markup var backend_only_markdown_re = [ // Inline image previews, check for contiguous chars ending in image suffix // To keep the below regexes simple, split them out for the end-of-message case /[^\s]*(?:(?:\.bmp|\.gif|\.jpg|\.jpeg|\.png|\.webp)\)?)\s+/m, /[^\s]*(?:(?:\.bmp|\.gif|\.jpg|\.jpeg|\.png|\.webp)\)?)$/m, // Twitter and youtube links are given previews /[^\s]*(?:twitter|youtube).com\/[^\s]*/, ]; exports.contains_backend_only_syntax = function (content) { // Try to guess whether or not a message has bugdown in it // If it doesn't, we can immediately render it client-side var markedup = _.find(backend_only_markdown_re, function (re) { return re.test(content); }); // If a realm filter doesn't start with some specified characters // then don't render it locally. It is workaround for the fact that // javascript regex doesn't support lookbehind. var false_filter_match = _.find(realm_filter_list, function (re) { var pattern = /(?:[^\s'"\(,:<])/.source + re[0].source + /(?![\w])/.source; var regex = new RegExp(pattern); return regex.test(content); }); return markedup !== undefined || false_filter_match !== undefined; }; exports.apply_markdown = function (message) { message_store.init_booleans(message); // Our python-markdown processor appends two \n\n to input var options = { userMentionHandler: function (name) { var person = people.get_by_name(name); if (person !== undefined) { if (people.is_my_user_id(person.user_id)) { message.mentioned = true; message.mentioned_me_directly = true; } return '' + '@' + escape(person.full_name, true) + ''; } else if (name === 'all' || name === 'everyone' || name === 'stream') { message.mentioned = true; return '' + '@' + name + ''; } return; }, groupMentionHandler: function (name) { var group = user_groups.get_user_group_from_name(name); if (group !== undefined) { if (user_groups.is_member_of(group.id, people.my_current_user_id())) { message.mentioned = true; } return '' + '@' + escape(group.name, true) + ''; } return; }, }; message.content = marked(message.raw_content + '\n\n', options).trim(); message.is_me_message = exports.is_status_message(message.raw_content, message.content); }; exports.add_subject_links = function (message) { if (message.type !== 'stream') { message.subject_links = []; return; } var subject = message.subject; var links = []; _.each(realm_filter_list, function (realm_filter) { var pattern = realm_filter[0]; var url = realm_filter[1]; var match; while ((match = pattern.exec(subject)) !== null) { var link_url = url; var matched_groups = match.slice(1); var i = 0; while (i < matched_groups.length) { var matched_group = matched_groups[i]; var current_group = i + 1; var back_ref = "\\" + current_group; link_url = link_url.replace(back_ref, matched_group); i += 1; } links.push(link_url); } }); message.subject_links = links; }; exports.is_status_message = function (raw_content, content) { return raw_content.indexOf('/me ') === 0 && raw_content.indexOf('\n') === -1 && content.indexOf('

') === 0 && content.lastIndexOf('

') === content.length - 4; }; function handleUnicodeEmoji(unicode_emoji) { var codepoint = unicode_emoji.codePointAt(0).toString(16); if (emoji_codes.codepoint_to_name.hasOwnProperty(codepoint)) { var emoji_name = emoji_codes.codepoint_to_name[codepoint]; var alt_text = ':' + emoji_name + ':'; var title = emoji_name.split("_").join(" "); return '' + alt_text + ''; } return unicode_emoji; } function handleEmoji(emoji_name) { var alt_text = ':' + emoji_name + ':'; var title = emoji_name.split("_").join(" "); if (emoji.active_realm_emojis.hasOwnProperty(emoji_name)) { var emoji_url = emoji.active_realm_emojis[emoji_name].emoji_url; return '' + alt_text + ''; } else if (emoji_codes.name_to_codepoint.hasOwnProperty(emoji_name)) { var codepoint = emoji_codes.name_to_codepoint[emoji_name]; return '' + alt_text + ''; } return alt_text; } function handleAvatar(email) { return '' + email + ''; } function handleStream(streamName) { var stream = stream_data.get_sub(streamName); if (stream === undefined) { return; } var href = window.location.origin + '/#narrow/stream/' + hash_util.encode_stream_name(stream.name); return '' + '#' + escape(stream.name) + ''; } function handleRealmFilter(pattern, matches) { var url = realm_filter_map[pattern]; var current_group = 1; _.each(matches, function (match) { var back_ref = "\\" + current_group; url = url.replace(back_ref, match); current_group += 1; }); return url; } function handleTex(tex, fullmatch) { try { return katex.renderToString(tex); } catch (ex) { if (ex.message.indexOf('KaTeX parse error') === 0) { // TeX syntax error return '' + escape(fullmatch) + ''; } blueslip.error(ex); } } function python_to_js_filter(pattern, url) { // Converts a python named-group regex to a javascript-compatible numbered // group regex... with a regex! var named_group_re = /\(?P<([^>]+?)>/g; var match = named_group_re.exec(pattern); var current_group = 1; while (match) { var name = match[1]; // Replace named group with regular matching group pattern = pattern.replace('(?P<' + name + '>', '('); // Replace named reference in url to numbered reference url = url.replace('%(' + name + ')s', '\\' + current_group); match = named_group_re.exec(pattern); current_group += 1; } // Convert any python in-regex flags to RegExp flags var js_flags = 'g'; var inline_flag_re = /\(\?([iLmsux]+)\)/; match = inline_flag_re.exec(pattern); // JS regexes only support i (case insensitivity) and m (multiline) // flags, so keep those and ignore the rest if (match) { var py_flags = match[1].split(""); _.each(py_flags, function (flag) { if ("im".indexOf(flag) !== -1) { js_flags += flag; } }); pattern = pattern.replace(inline_flag_re, ""); } // Ideally we should have been checking that realm filters // begin with certain characters but since there is no // support for negative lookbehind in javascript, we check // for this condition in `contains_backend_only_syntax()` // function. If the condition is satisfied then the message // is rendered locally, otherwise, we return false there and // message is rendered on the backend which has proper support // for negative lookbehind. pattern = pattern + /(?![\w])/.source; return [new RegExp(pattern, js_flags), url]; } exports.set_realm_filters = function (realm_filters) { // Update the marked parser with our particular set of realm filters realm_filter_map = {}; realm_filter_list = []; var marked_rules = []; _.each(realm_filters, function (realm_filter) { var pattern = realm_filter[0]; var url = realm_filter[1]; var js_filters = python_to_js_filter(pattern, url); realm_filter_map[js_filters[0]] = js_filters[1]; realm_filter_list.push([js_filters[0], js_filters[1]]); marked_rules.push(js_filters[0]); }); marked.InlineLexer.rules.zulip.realm_filters = marked_rules; }; var preprocess_auto_olists = (function () { var TAB_LENGTH = 2; var re = /^( *)(\d+)\. +(.*)/; function getIndent(match) { return Math.floor(match[1].length / TAB_LENGTH); } function extendArray(arr, arr2) { Array.prototype.push.apply(arr, arr2); } function renumber(mlist) { if (!mlist.length) { return []; } var startNumber = parseInt(mlist[0][2], 10); var changeNumbers = _.every(mlist, function (m) { return startNumber === parseInt(m[2], 10); }); var counter = startNumber; return _.map(mlist, function (m) { var number = changeNumbers ? counter.toString() : m[2]; counter += 1; return m[1] + number + '. ' + m[3]; }); } return function (src) { var newLines = []; var currentList = []; var currentIndent = 0; _.each(src.split('\n'), function (line) { var m = line.match(re); var isNextItem = m && currentList.length && currentIndent === getIndent(m); if (!isNextItem) { extendArray(newLines, renumber(currentList)); currentList = []; } if (!m) { newLines.push(line); } else if (isNextItem) { currentList.push(m); } else { currentList = [m]; currentIndent = getIndent(m); } }); extendArray(newLines, renumber(currentList)); return newLines.join('\n'); }; }()); exports.initialize = function () { function disable_markdown_regex(rules, name) { rules[name] = {exec: function () { return false; }}; } // Configure the marked markdown parser for our usage var r = new marked.Renderer(); // No around our code blocks instead a codehilite
and disable // class-specific highlighting. r.code = function (code) { return '
'
          + escape(code, true)
          + '\n
\n\n\n'; }; // Our links have title= and target=_blank r.link = function (href, title, text) { title = title || href; var out = '' + text + ''; return out; }; // Put a newline after a
in the generated HTML to match bugdown r.br = function () { return '
\n'; }; function preprocess_code_blocks(src) { return fenced_code.process_fenced_code(src); } function preprocess_translate_emoticons(src) { if (!page_params.translate_emoticons) { return src; } // In this scenario, the message has to be from the user, so the only // requirement should be that they have the setting on. return emoji.translate_emoticons_to_names(src); } // Disable ordered lists // We used GFM + tables, so replace the list start regex for that ruleset // We remove the |[\d+]\. that matches the numbering in a numbered list marked.Lexer.rules.tables.list = /^( *)((?:\*)) [\s\S]+?(?:\n+(?=(?: *[\-*_]){3,} *(?:\n+|$))|\n{2,}(?! )(?!\1(?:\*) )\n*|\s*$)/; // Disable headings disable_markdown_regex(marked.Lexer.rules.tables, 'heading'); disable_markdown_regex(marked.Lexer.rules.tables, 'lheading'); // Disable __strong__ (keeping **strong**) marked.InlineLexer.rules.zulip.strong = /^\*\*([\s\S]+?)\*\*(?!\*)/; // Make sure syntax matches the backend processor marked.InlineLexer.rules.zulip.del = /^(?!<\~)\~\~([^~]+)\~\~(?!\~)/; // Disable _emphasis_ (keeping *emphasis*) // Text inside ** must start and end with a word character // to prevent mis-parsing things like "char **x = (char **)y" marked.InlineLexer.rules.zulip.em = /^\*(?!\s+)((?:\*\*|[\s\S])+?)((?:[\S]))\*(?!\*)/; // Disable autolink as (a) it is not used in our backend and (b) it interferes with @mentions disable_markdown_regex(marked.InlineLexer.rules.zulip, 'autolink'); exports.set_realm_filters(page_params.realm_filters); // Tell our fenced code preprocessor how to insert arbitrary // HTML into the output. This generated HTML is safe to not escape fenced_code.set_stash_func(function (html) { return marked.stashHtml(html, true); }); fenced_code.set_escape_func(escape); marked.setOptions({ gfm: true, tables: true, breaks: true, pedantic: false, sanitize: true, smartLists: true, smartypants: false, zulip: true, emojiHandler: handleEmoji, avatarHandler: handleAvatar, unicodeEmojiHandler: handleUnicodeEmoji, streamHandler: handleStream, realmFilterHandler: handleRealmFilter, texHandler: handleTex, renderer: r, preprocessors: [ preprocess_code_blocks, preprocess_auto_olists, preprocess_translate_emoticons, ], }); }; return exports; }()); if (typeof module !== 'undefined') { module.exports = markdown; } window.markdown = markdown;