File size: 4,648 Bytes
db5855f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
import argparse
import shutil
import subprocess  # nosec - disable B404:import-subprocess check
import time
from pathlib import Path
import nbformat


def disable_gradio_debug(notebook_path):
    nb = nbformat.read(notebook_path, as_version=nbformat.NO_CONVERT)
    found = False
    for cell in nb["cells"]:
        if "gradio" in cell["source"] and "debug" in cell["source"]:
            found = True
            cell["source"] = cell["source"].replace("debug=True", "debug=False")

    if found:
        print(f"Disabled gradio debug mode for {notebook_path}")
        nbformat.write(nb, str(notebook_path), version=nbformat.NO_CONVERT)


def arguments():
    parser = argparse.ArgumentParser()
    parser.add_argument("--exclude_execution_file")
    parser.add_argument("--exclude_conversion_file")
    parser.add_argument("--timeout", type=float, default=7200, help="timeout for notebook execution")
    parser.add_argument("--rst_dir", type=Path, help="rst files output directory", default=Path("rst"))

    return parser.parse_args()


def prepare_ignore_list(input_file):
    with Path(input_file).open("r") as f:
        lines = f.readlines()
    return list(map(str.strip, lines))


def main():
    args = arguments()
    ignore_conversion_list = []
    ignore_execution_list = []
    failed_notebooks = []
    rst_failed = []
    if args.exclude_conversion_file is not None:
        ignore_conversion_list = prepare_ignore_list(args.exclude_conversion_file)
    if args.exclude_execution_file is not None:
        ignore_execution_list = prepare_ignore_list(args.exclude_execution_file)
    root = Path(__file__).parents[1]
    notebooks_dir = root / "notebooks"
    notebooks = sorted(list(notebooks_dir.rglob("**/*.ipynb")))
    for notebook in notebooks:
        notebook_path = notebook.relative_to(root)
        if str(notebook_path) in ignore_conversion_list:
            continue
        disable_gradio_debug(notebook_path)
        notebook_executed = notebook_path.parent / notebook_path.name.replace(".ipynb", "-with-output.ipynb")
        start = time.perf_counter()
        print(f"Convert {notebook_path}")
        if str(notebook_path) not in ignore_execution_list:
            try:
                retcode = subprocess.run(
                    [
                        "jupyter",
                        "nbconvert",
                        "--log-level=INFO",
                        "--execute",
                        "--to",
                        "notebook",
                        "--output",
                        str(notebook_executed),
                        "--output-dir",
                        str(root),
                        "--ExecutePreprocessor.kernel_name=python3",
                        str(notebook_path),
                    ],
                    timeout=args.timeout,
                ).returncode
            except subprocess.TimeoutExpired:
                retcode = -42
                print(f"TIMEOUT: {notebook_path}")
            if retcode:
                failed_notebooks.append(str(notebook_path))
                continue
        else:
            shutil.copyfile(notebook_path, notebook_executed)
        rst_retcode = subprocess.run(
            [
                "jupyter",
                "nbconvert",
                "--to",
                "rst",
                str(notebook_executed),
                "--output-dir",
                str(args.rst_dir),
                "--TagRemovePreprocessor.remove_all_outputs_tags=hide_output --TagRemovePreprocessor.enabled=True",
            ],
            timeout=args.timeout,
        ).returncode
        notebook_rst = args.rst_dir / notebook_executed.name.replace(".ipynb", ".rst")
        # remove all non-printable characters
        subprocess.run(
            [
                "sed",
                "-i",
                "-e",
                "s/\x1b\[[0-9;]*m//g",
                "-e",
                "s/\x1b\[?25h//g",
                "-e",
                "s/\x1b\[?25l//g",
                str(notebook_rst),
            ],
            timeout=args.timeout,
        )

        end = time.perf_counter() - start
        print(f"Notebook conversion took: {end:.4f} s")
        if rst_retcode:
            rst_failed.append(str(notebook_path))

    if failed_notebooks:
        print("EXECUTION FAILED:")
        print("\n".join(failed_notebooks))

    if rst_failed:
        print("RST CONVERSION FAILED:")
        print("\n".join(rst_failed))


if __name__ == "__main__":
    main()