NDOJ/judge/markdown.py

import markdown as _markdown
import bleach
from django.utils.html import escape
from bs4 import BeautifulSoup
from pymdownx import superfences


EXTENSIONS = [
    "pymdownx.arithmatex",
    "pymdownx.magiclink",
    "pymdownx.betterem",
    "pymdownx.details",
    "pymdownx.emoji",
    "pymdownx.inlinehilite",
    "pymdownx.superfences",
    "pymdownx.highlight",
    "pymdownx.tasklist",
    "markdown.extensions.footnotes",
    "markdown.extensions.attr_list",
    "markdown.extensions.def_list",
    "markdown.extensions.tables",
    "markdown.extensions.admonition",
    "nl2br",
    "mdx_breakless_lists",
]

EXTENSION_CONFIGS = {
    "pymdownx.superfences": {
        "custom_fences": [
            {
                "name": "sample",
                "class": "no-border",
                "format": superfences.fence_code_format,
            }
        ],
    },
    "pymdownx.highlight": {
        "auto_title": True,
        "auto_title_map": {
            "Text Only": "",
        },
    },
}

ALLOWED_TAGS = list(bleach.sanitizer.ALLOWED_TAGS) + [
    "img",
    "center",
    "iframe",
    "div",
    "span",
    "table",
    "tr",
    "td",
    "th",
    "tr",
    "pre",
    "code",
    "p",
    "hr",
    "h1",
    "h2",
    "h3",
    "h4",
    "h5",
    "h6",
    "thead",
    "tbody",
    "sup",
    "dl",
    "dt",
    "dd",
    "br",
    "details",
    "summary",
]

ALLOWED_ATTRS = ["src", "width", "height", "href", "class", "open"]


def markdown(value, lazy_load=False):
    extensions = EXTENSIONS
    html = _markdown.markdown(
        value, extensions=extensions, extension_configs=EXTENSION_CONFIGS
    )

    # Don't clean mathjax
    hash_script_tag = {}
    soup = BeautifulSoup(html, "html.parser")
    for script_tag in soup.find_all("script"):
        allow_math_types = ["math/tex", "math/tex; mode=display"]
        if script_tag.attrs.get("type", False) in allow_math_types:
            hash_script_tag[str(hash(str(script_tag)))] = str(script_tag)

    for hashed_tag in hash_script_tag:
        tag = hash_script_tag[hashed_tag]
        html = html.replace(tag, hashed_tag)

    html = bleach.clean(html, tags=ALLOWED_TAGS, attributes=ALLOWED_ATTRS)

    for hashed_tag in hash_script_tag:
        tag = hash_script_tag[hashed_tag]
        html = html.replace(hashed_tag, tag)

    if not html:
        html = escape(value)
    if lazy_load:
        soup = BeautifulSoup(html, features="html.parser")
        for img in soup.findAll("img"):
            if img.get("src"):
                img["data-src"] = img["src"]
                img["src"] = ""
        for img in soup.findAll("iframe"):
            if img.get("src"):
                img["data-src"] = img["src"]
                img["src"] = ""
        html = str(soup)
    return '<div class="md-typeset content-description">%s</div>' % html
Change pre code css in markdown 2024-01-18 19:46:41 -06:00			`import markdown as _markdown`
			`import bleach`
			`from django.utils.html import escape`
			`from bs4 import BeautifulSoup`
			`from pymdownx import superfences`


			`EXTENSIONS = [`
			`"pymdownx.arithmatex",`
			`"pymdownx.magiclink",`
			`"pymdownx.betterem",`
			`"pymdownx.details",`
			`"pymdownx.emoji",`
			`"pymdownx.inlinehilite",`
			`"pymdownx.superfences",`
			`"pymdownx.highlight",`
			`"pymdownx.tasklist",`
			`"markdown.extensions.footnotes",`
			`"markdown.extensions.attr_list",`
			`"markdown.extensions.def_list",`
			`"markdown.extensions.tables",`
			`"markdown.extensions.admonition",`
			`"nl2br",`
			`"mdx_breakless_lists",`
			`]`

			`EXTENSION_CONFIGS = {`
			`"pymdownx.superfences": {`
			`"custom_fences": [`
			`{`
			`"name": "sample",`
			`"class": "no-border",`
			`"format": superfences.fence_code_format,`
			`}`
			`],`
			`},`
			`"pymdownx.highlight": {`
			`"auto_title": True,`
			`"auto_title_map": {`
			`"Text Only": "",`
			`},`
			`},`
			`}`

			`ALLOWED_TAGS = list(bleach.sanitizer.ALLOWED_TAGS) + [`
			`"img",`
			`"center",`
			`"iframe",`
			`"div",`
			`"span",`
			`"table",`
			`"tr",`
			`"td",`
			`"th",`
			`"tr",`
			`"pre",`
			`"code",`
			`"p",`
			`"hr",`
			`"h1",`
			`"h2",`
			`"h3",`
			`"h4",`
			`"h5",`
			`"h6",`
			`"thead",`
			`"tbody",`
			`"sup",`
			`"dl",`
			`"dt",`
			`"dd",`
			`"br",`
			`"details",`
			`"summary",`
			`]`

			`ALLOWED_ATTRS = ["src", "width", "height", "href", "class", "open"]`


			`def markdown(value, lazy_load=False):`
			`extensions = EXTENSIONS`
			`html = _markdown.markdown(`
			`value, extensions=extensions, extension_configs=EXTENSION_CONFIGS`
			`)`

			`# Don't clean mathjax`
			`hash_script_tag = {}`
			`soup = BeautifulSoup(html, "html.parser")`
			`for script_tag in soup.find_all("script"):`
			`allow_math_types = ["math/tex", "math/tex; mode=display"]`
			`if script_tag.attrs.get("type", False) in allow_math_types:`
			`hash_script_tag[str(hash(str(script_tag)))] = str(script_tag)`

			`for hashed_tag in hash_script_tag:`
			`tag = hash_script_tag[hashed_tag]`
			`html = html.replace(tag, hashed_tag)`

			`html = bleach.clean(html, tags=ALLOWED_TAGS, attributes=ALLOWED_ATTRS)`

			`for hashed_tag in hash_script_tag:`
			`tag = hash_script_tag[hashed_tag]`
			`html = html.replace(hashed_tag, tag)`

			`if not html:`
			`html = escape(value)`
			`if lazy_load:`
			`soup = BeautifulSoup(html, features="html.parser")`
			`for img in soup.findAll("img"):`
			`if img.get("src"):`
			`img["data-src"] = img["src"]`
			`img["src"] = ""`
			`for img in soup.findAll("iframe"):`
			`if img.get("src"):`
			`img["data-src"] = img["src"]`
			`img["src"] = ""`
			`html = str(soup)`
			`return '<div class="md-typeset content-description">%s</div>' % html`