blender-projects-gitea-custom/sphinx/sphinx_to_html.py

#!/usr/bin/python3

import argparse
import html
import os
import pathlib
import re
import shutil
import subprocess
import sys
import tempfile

# Read the complete RST page to preview from standard input. It is rewritten
# below and saved as contents.rst for sphinx-build.
page_contents = sys.stdin.read()

# Site roots that may prefix GITEA_PREFIX_SRC. Generated links always point
# at the production site (base_url), whichever root the prefix came from.
base_url = "https://projects.blender.org"
uatest_base_url = "https://uatest.projects.blender.org"
local_url = "http://localhost:3000"
# Stand-in link target; hrefs starting with it are swapped for a
# "not available in preview" anchor in the rendered HTML.
placeholder_url = "https://placeholder.org"


def strip_site_root(prefix):
    """Return `prefix` with any known leading site root removed.

    The roots are tried in the order production, UA test, local development,
    so the result is a host-relative path such as "/org/repo/src/branch/main".
    """
    for site_root in (base_url, uatest_base_url, local_url):
        prefix = prefix.removeprefix(site_root)
    return prefix


def resolve_preview_urls(prefix):
    """Return `(doc_url, image_url)` for a host-relative source prefix.

    `prefix` is expected to look like "/org/repo/view/ref/branch[/...]".
    When it has fewer than five path components (including the empty string)
    both URLs are empty, instead of failing on tuple unpacking.
    """
    path_tokens = prefix.strip('/').split('/')
    if len(path_tokens) < 5:
        return "", ""

    org, repo, view, ref, branch = path_tokens[:5]
    doc = f"{base_url}/{org}/{repo}/{view}/{ref}/{branch}"
    image = f"{base_url}/{org}/{repo}/media/{ref}/{branch}"

    # Hardcoded exception for blender-manual, that has links relative
    # to manual/ folder.
    if len(path_tokens) > 5 and path_tokens[5] == 'manual':
        doc += "/manual"
        image += "/manual"
    return doc, image


# Gitea sets this environment variable with the URL prefix for the current file.
gitea_prefix = strip_site_root(os.environ.get("GITEA_PREFIX_SRC", ""))
doc_url, image_url = resolve_preview_urls(gitea_prefix)

# Set up temporary directory with sphinx configuration, rewrite the page so it
# can be built on its own, run sphinx-build and print the HTML body to stdout.
with tempfile.TemporaryDirectory() as tmp_dir:
    work_dir = pathlib.Path(tmp_dir) / "work"

    # The Sphinx project skeleton is the "template" folder next to this script.
    script_dir = pathlib.Path(__file__).parent.resolve()
    shutil.copytree(script_dir / "template", work_dir)
    page_filepath = work_dir / "contents.rst"

    # Turn links into external links since internal links are not found and stripped.
    def path_to_label(path):
        """Build a readable label from the last component of a document path."""
        path = path.removesuffix('/index')
        return path.split('/')[-1].replace('_', ' ').replace('-', ' ').capitalize()

    def external_link(label, url):
        """Format an RST external hyperlink with an embedded URI.

        Whitespace in the label (including line breaks) is collapsed and a
        single space always separates it from `<`; without that space the
        embedded URI is not recognized.
        """
        label = " ".join(label.split())
        return f"`{label} <{url}>`_"

    def doc_target(path):
        """Return the URL of the .rst source for a document path."""
        return f"{doc_url}/{path.strip('/')}.rst"

    def doc_label_link(matchobj):
        return external_link(matchobj.group(1), doc_target(matchobj.group(2)))

    def doc_link(matchobj):
        return external_link(path_to_label(matchobj.group(1)), doc_target(matchobj.group(1)))

    def ref_label_link(matchobj):
        return external_link(matchobj.group(1), placeholder_url)

    def ref_link(matchobj):
        return external_link(path_to_label(matchobj.group(1)), placeholder_url)

    def term_link(matchobj):
        return external_link(matchobj.group(1), placeholder_url)

    def media_directive(matchobj):
        """Point a figure/image directive at the repository media URL.

        Targets that already carry a URL scheme are left untouched.
        """
        directive = matchobj.group(1)
        target = matchobj.group(2).strip()
        if re.match(r"[A-Za-z][A-Za-z0-9+.-]*://", target):
            return matchobj.group(0)
        return f"{directive}:: {image_url}/{target.lstrip('/')}"

    # Order matters: labelled roles are rewritten before their plain forms.
    # The figure/image rule captures the whole directive argument (the rest of
    # the line) rather than a single character.
    link_rules = (
        (r":doc:`/(.+?)`", doc_link),
        (r":doc:`([\w\s\n-]+?)\n?<(.+?)>`", doc_label_link),
        (r":ref:`([\w\s\n-]+?)\n?<(.+?)>`", ref_label_link),
        (r":ref:`([\w\s-]+?)`", ref_link),
        (r":term:`([\w\s\n-]+?)\n?<(.+?)>`", term_link),
        (r":term:`([\w\s-]+?)`", term_link),
        (r"(figure|image):: (.+)", media_directive),
    )
    for pattern, handler in link_rules:
        page_contents = re.sub(pattern, handler, page_contents)

    # Disable include directives and raw for security. They are already disabled
    # by docutils.py, this is just to be extra careful.
    def include_directive(matchobj):
        return f"warning:: include not available in preview: {html.escape(matchobj.group(1))}"

    def raw_directive(matchobj):
        return f"warning:: raw not available in preview: {html.escape(matchobj.group(1))}"

    # literalinclude must be handled before the shorter "include::" pattern.
    page_contents = re.sub(r"literalinclude::(.*)", include_directive, page_contents)
    page_contents = re.sub(r"include::(.*)", include_directive, page_contents)
    page_contents = re.sub(r"raw::(.*)", raw_directive, page_contents)
    # A toctree cannot be resolved for a single page; show its entries verbatim.
    page_contents = re.sub(r"\.\. toctree::(.*)", ".. code-block:: none", page_contents)
    page_contents = re.sub(r":maxdepth:(.*)", "", page_contents)
    page_contents = page_contents.replace("|BLENDER_VERSION|", "BLENDER_VERSION")

    # Write UTF-8 explicitly instead of relying on the process locale.
    # NOTE(review): assumes the template's conf.py keeps Sphinx's default
    # UTF-8 source encoding - confirm.
    page_filepath.write_text(page_contents, encoding="utf-8")

    # Debug processed RST
    # print(html.escape(page_contents).replace('\n', '<br/>\n'))
    # sys.exit(0)

    # Run sphinx-build.
    out_dir = work_dir / "out"
    out_filepath = out_dir / "contents.html"

    sphinx_build = script_dir / "venv" / "bin" / "sphinx-build"
    sphinx_cmd = [sphinx_build, "-b", "html", work_dir, out_dir]
    result = subprocess.run(sphinx_cmd, capture_output=True)

    # Output errors.
    error = result.stderr.decode("utf-8", "ignore").strip()
    if error:
        # Drop the temporary file path so messages start at the line number.
        error = error.replace(str(page_filepath) + ":", "")
        error = html.escape(error)
        print("<h2>Sphinx Warnings</h2>\n")
        print(f"<pre>{error}</pre>")
        print("<p>Note the preview is not accurate and warnings may not indicate real issues.</p>")

    # Output contents of body.
    if result.returncode == 0 and out_filepath.is_file():
        contents = out_filepath.read_text(encoding="utf-8")
        body = contents.split("<body>")[1].split("</body>")[0]
        # Placeholder links cannot be resolved in the preview; the remaining
        # absolute links open in a new tab.
        body = body.replace(f'href="{placeholder_url}', 'href="#link-not-available-in-preview"')
        body = body.replace('href="http', 'target="_blank" href="http')
        body = '<div class="restructuredtext">' + body + '</div>'
        print(body)
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`#!/usr/bin/python3`

			`import argparse`
			`import html`
			`import os`
			`import pathlib`
			`import re`
			`import shutil`
			`import subprocess`
			`import sys`
			`import tempfile`

Sphinx: simplify running process as another user 2023-05-09 09:45:35 -05:00			`page_contents = sys.stdin.read()`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00
			`base_url = "https://projects.blender.org"`
Fix problem displaying images in RST preview 2023-05-25 05:59:48 -05:00			`uatest_base_url = "https://uatest.projects.blender.org"`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`local_url = "http://localhost:3000"`
			`placeholder_url = "https://placeholder.org"`

			`# Gitea sets this environment variable with the URL prefix for the current file.`
			`gitea_prefix = os.environ.get("GITEA_PREFIX_SRC", "")`
			`if gitea_prefix.startswith(base_url):`
			`gitea_prefix = gitea_prefix[len(base_url):]`
Fix problem displaying images in RST preview 2023-05-25 05:59:48 -05:00			`if gitea_prefix.startswith(uatest_base_url):`
			`gitea_prefix = gitea_prefix[len(uatest_base_url):]`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`if gitea_prefix.startswith(local_url):`
			`gitea_prefix = gitea_prefix[len(local_url):]`

			`if len(gitea_prefix):`
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			`path_tokens = gitea_prefix.strip('/').split('/')`
			`org, repo, view, ref, branch = path_tokens[:5]`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00
			`doc_url = f"{base_url}/{org}/{repo}/{view}/{ref}/{branch}"`
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			`image_url = f"{base_url}/{org}/{repo}/media/{ref}/{branch}"`

			`# Hardcoded exception for blender-manual, that has links relative`
			`# to manual/ folder.`
			`if len(path_tokens) > 5 and path_tokens[5] == 'manual':`
			`doc_url += "/manual"`
			`image_url += "/manual"`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`else:`
			`doc_url = ""`
			`image_url = ""`

			`# Set up temporary directory with sphinx configuration.`
Sphinx: simplify running process as another user 2023-05-09 09:45:35 -05:00			`with tempfile.TemporaryDirectory() as tmp_dir:`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`work_dir = pathlib.Path(tmp_dir) / "work"`

			`script_dir = pathlib.Path(__file__).parent.resolve()`
			`shutil.copytree(script_dir / "template", work_dir)`
			`page_filepath = work_dir / "contents.rst"`

			`# Turn links into external links since internal links are not found and stripped.`
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			`def path_to_label(path):`
			`path = path.removesuffix('/index')`
			`return path.split('/')[-1].replace('_', ' ').replace('-', ' ').capitalize()`
			`def doc_label_link(matchobj):`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			return f"`{matchobj.group(1)}<{doc_url}/{matchobj.group(2).strip('/')}.rst>`_"
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			`def doc_link(matchobj):`
			return f"`{path_to_label(matchobj.group(1))} <{doc_url}/{matchobj.group(1).strip('/')}.rst>`_"
			`def ref_label_link(matchobj):`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			return f"`{matchobj.group(1)} <{placeholder_url}>`_"
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			`def ref_link(matchobj):`
			return f"`{path_to_label(matchobj.group(1))} <{placeholder_url}>`_"
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`def term_link(matchobj):`
			return f"`{matchobj.group(1)} <{placeholder_url}>`_"
			`def figure_link(matchobj):`
			`return f"figure:: {image_url}/{matchobj.group(1).strip('/')}"`
			`def image_link(matchobj):`
			`return f"image:: {image_url}/{matchobj.group(1).strip('/')}"`

Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			page_contents = re.sub(":doc:`/(.+?)`", doc_link, page_contents)
Fix some unecessary Sphinx warnings in RST preview 2023-05-25 12:07:41 -05:00			page_contents = re.sub(":doc:`([\w\s\n-]+?)\n?<(.+?)>`", doc_label_link, page_contents)
			page_contents = re.sub(":ref:`([\w\s\n-]+?)\n?<(.+?)>`", ref_label_link, page_contents)
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			page_contents = re.sub(":ref:`([\w\s-]+?)`", ref_link, page_contents)
Fix some unecessary Sphinx warnings in RST preview 2023-05-25 12:07:41 -05:00			page_contents = re.sub(":term:`([\w\s\n-]+?)\n?<(.+?)>`", term_link, page_contents)
Fix various issues in Sphinx .rst rendering for the blender-manual repo 2023-04-06 12:36:58 -05:00			page_contents = re.sub(":term:`([\w\s-]+?)`", term_link, page_contents)
			`page_contents = re.sub("figure:: (.+?)", figure_link, page_contents)`
			`page_contents = re.sub("image:: (.+?)", image_link, page_contents)`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00
			`# Disable include directives and raw for security. They are already disabled`
			`# by docutils.py, this is just to be extra careful.`
			`def include_directive(matchobj):`
Fix issues with links, includes and notes in Sphinx .rst preview styling 2023-03-13 18:58:31 -05:00			`return f"warning:: include not available in preview: {html.escape(matchobj.group(1))}"`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`def raw_directive(matchobj):`
Fix issues with links, includes and notes in Sphinx .rst preview styling 2023-03-13 18:58:31 -05:00			`return f"warning:: raw not available in preview: {html.escape(matchobj.group(1))}"`
			`page_contents = re.sub("literalinclude::(.*)", include_directive, page_contents)`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`page_contents = re.sub("include::(.*)", include_directive, page_contents)`
			`page_contents = re.sub("raw::(.*)", raw_directive, page_contents)`
Fix some unecessary Sphinx warnings in RST preview 2023-05-25 12:07:41 -05:00			`page_contents = re.sub(".. toctree::(.*)", ".. code-block:: none", page_contents)`
			`page_contents = re.sub(":maxdepth:(.*)", "", page_contents)`
			`page_contents = page_contents.replace("\|BLENDER_VERSION\|", "BLENDER_VERSION")`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00
			`page_filepath.write_text(page_contents)`

			`# Debug processed RST`
			`# print(html.escape(page_contents).replace('\n', '<br/>\n'))`
			`# sys.exit(0)`

			`# Run sphinx-build.`
			`out_dir = work_dir / "out"`
			`out_filepath = out_dir / "contents.html"`

Fix sphinx-build not found in Python venv 2023-05-25 05:26:56 -05:00			`sphinx_build = script_dir / "venv" / "bin" / "sphinx-build"`
			`sphinx_cmd = [sphinx_build, "-b", "html", work_dir, out_dir]`
Sphinx: simplify running process as another user 2023-05-09 09:45:35 -05:00			`result = subprocess.run(sphinx_cmd, capture_output=True)`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00
			`# Output errors.`
			`error = result.stderr.decode("utf-8", "ignore").strip()`
			`if len(error):`
			`error = error.replace(str(page_filepath) + ":", "")`
			`error = html.escape(error)`
			`print("<h2>Sphinx Warnings</h2>\n")`
			`print(f"<pre>{error}</pre>")`
			`print("<p>Note the preview is not accurate and warnings may not indicate real issues.</p>")`

			`# Output contents of body.`
			`if result.returncode == 0 and out_filepath.is_file():`
			`contents = out_filepath.read_text()`
			`body = contents.split("<body>")[1].split("</body>")[0]`
Fix issues with links, includes and notes in Sphinx .rst preview styling 2023-03-13 18:58:31 -05:00			`body = body.replace(f'href="{placeholder_url}', 'href="#link-not-available-in-preview"')`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`body = body.replace('href="http', 'target="_blank" href="http')`
Fix issues with links, includes and notes in Sphinx .rst preview styling 2023-03-13 18:58:31 -05:00			`body = '<div class="restructuredtext">' + body + '</div>'`
Add renderer for Sphinx .rst files, for user manual previews Ref infrastructure/blender-projects-platform#51 Pull Request: https://projects.blender.org/infrastructure/gitea-custom/pulls/2 2023-03-09 12:18:50 -05:00			`print(body)`