ortools-clone/tools/export_to_ipynb.py

#!/usr/bin/env python3
# Copyright 2010-2025 Google LLC
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Transform any Python sample or example to Python NoteBook."""
import ast
import os
import re
import sys

from nbformat import v3
from nbformat import v4

# The script takes exactly one positional argument: the path of the Python
# sample to convert. Fail with a usage message instead of a bare IndexError.
if len(sys.argv) < 2:
    sys.exit(f"usage: {sys.argv[0]} <python_file>")
input_file = sys.argv[1]
print(f"reading {input_file}")
with open(input_file, encoding="utf-8") as fpin:
    text = fpin.read()

# Compute output file path.
# Only the trailing extension is swapped: a plain str.replace(".py", ...) would
# also rewrite any ".py" occurring inside a directory name, and would leave a
# path without a ".py" suffix unchanged (so the output could overwrite the
# input file).
output_file = os.path.splitext(input_file)[0] + ".ipynb"
# For examples/python/foo.py -> examples/notebook/examples/foo.ipynb
output_file = output_file.replace("examples/python", "examples/notebook/examples")
# For examples/contrib/foo.py -> examples/notebook/contrib/foo.ipynb
output_file = output_file.replace("examples/contrib", "examples/notebook/contrib")
# For ortools/*/samples/foo.py -> examples/notebook/*/foo.ipynb
# NOTE(review): these two replacements are substring based, so every
# occurrence of "ortools" / "samples/" in the path is rewritten, including
# one inside the file name itself.
output_file = output_file.replace("ortools", "examples/notebook")
output_file = output_file.replace("samples/", "")

# Start from an empty v3 notebook and immediately upgrade it to the v4 format.
nbook = v4.upgrade(v3.reads_py(""))

METADATA = {"language_info": {"name": "python"}}
nbook["metadata"] = METADATA


def _append_markdown(cell_id, source):
    """Append a markdown cell with the given id and source to the notebook."""
    nbook["cells"].append(v4.new_markdown_cell(source=source, id=cell_id))


print("Adding copyright cell...")
GOOGLE = "##### Copyright 2025 Google LLC."
_append_markdown("google", GOOGLE)

print("Adding license cell...")
APACHE = """Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""
_append_markdown("apache", APACHE)

print("Adding Title cell...")
# The title is the input file name with every ".py" occurrence removed.
_title_stem = os.path.basename(input_file).replace(".py", "")
basename = f"# {_title_stem}"
_append_markdown("basename", basename)

print("Adding link cell...")
# Both logos are served from the tools/ directory of the main branch.
_RAW_TOOLS_URL = "https://raw.githubusercontent.com/google/or-tools/main/tools/"
_BLOB_MAIN_PATH = "github/google/or-tools/blob/main/"
GITHUB_LOGO = _RAW_TOOLS_URL + "github_32px.png"
GITHUB_PATH = f"https://github.com/google/or-tools/blob/main/{input_file}"

COLAB_PATH = f"https://colab.research.google.com/{_BLOB_MAIN_PATH}{output_file}"
COLAB_LOGO = _RAW_TOOLS_URL + "colab_32px.png"
# Two-column HTML table: "Run in Google Colab" and "View source on GitHub".
link = "\n".join(
    [
        '<table align="left">',
        "<td>",
        f'<a href="{COLAB_PATH}"><img src="{COLAB_LOGO}"/>Run in Google Colab</a>',
        "</td>",
        "<td>",
        f'<a href="{GITHUB_PATH}"><img src="{GITHUB_LOGO}"/>View source on GitHub</a>',
        "</td>",
        "</table>",
    ]
)
_append_markdown("link", link)

print("Adding ortools install cell...")
INSTALL_DOC = (
    "First, you must install [ortools](https://pypi.org/project/ortools/) "
    "package in this colab."
)
_append_markdown("doc", INSTALL_DOC)
# The install command is a code cell so that it can be executed in the notebook.
INSTALL_CMD = "%pip install ortools"
nbook["cells"].append(v4.new_code_cell(source=INSTALL_CMD, id="install"))

print("Adding code cell...")
all_blocks = ast.parse(text).body
print(f"number of blocks: {len(all_blocks)}")
lines = text.split("\n")
# 0-based index of the line on which each top-level statement starts.
line_start = [c.lineno - 1 for c in all_blocks]
if line_start:
    # Everything that precedes the first statement (shebang, license header,
    # comments) is attached to the first block. The guard keeps a source file
    # without any statement from raising IndexError.
    line_start[0] = 0
# A block ends where the next one starts; the last one runs to end of file.
line_end = line_start[1:] + [len(lines)]

# Matches the `# [START xxx]` / `# [END xxx]` region markers at end of line.
_REGION_TAG = re.compile(r"# \[(?:START|END) .*\]$")


def _strip_region_tags(block_lines):
    """Return `block_lines` without the lines ending in a START/END marker."""
    return [line for line in block_lines if not _REGION_TAG.search(line)]


def _is_absl_import(node, name):
    """Tell whether `node` is `from absl import <name>`.

    Only the first imported name of the statement is inspected.
    """
    return (
        isinstance(node, ast.ImportFrom)
        and node.module == "absl"
        and node.names[0].name == name
    )


def _is_main_guard(node):
    """Tell whether `node` is an `if <expr> == "__main__":` statement.

    Any other `if` (e.g. `if DEBUG:` or `if a == b:`) yields False instead of
    raising AttributeError, and `ast.Constant.value` is read rather than the
    deprecated `.s` alias.
    """
    if not isinstance(node, ast.If) or not isinstance(node.test, ast.Compare):
        return False
    first = node.test.comparators[0]
    return isinstance(first, ast.Constant) and first.value == "__main__"


# Pieces of the single code cell, in source order.
code_parts = []
for idx, (c_block, s, e) in enumerate(zip(all_blocks, line_start, line_end)):
    print(f"block[{idx}]: {c_block}")
    # Clean boilerplate header and description
    if (
        idx == 0
        and isinstance(c_block, ast.Expr)
        and isinstance(c_block.value, ast.Constant)
    ):
        print("Adding description cell...")
        # TODO(user): Remove only copyright not all line with '^#'
        # Dropping every line starting with '#' also removes the shebang.
        filtered_lines = [
            line.replace('"""', "")
            for line in _strip_region_tags(lines[s:e])
            if not line.startswith("#")
        ]
        filtered_text = "\n".join(filtered_lines)
        nbook["cells"].append(
            v4.new_markdown_cell(source=filtered_text, id="description")
        )
    # Remove absl app import
    elif _is_absl_import(c_block, "app"):
        print(f"Removing import {c_block.module}.{c_block.names[0].name}...")
    # rewrite absl flag import
    elif _is_absl_import(c_block, "flags"):
        print(f"Rewrite import {c_block.module}.{c_block.names[0].name}...")
        code_parts.append("from ortools.sat.colab import flags\n")
    # Unwrap __main__ function
    elif _is_main_guard(c_block):
        print("Unwrapping main function...")
        # Drop the `if` line itself. For the very first block `s` is forced to
        # 0, so the guard is located through its own line number and any
        # header lines that precede it are kept.
        guard_line = c_block.lineno - 1
        c_lines = lines[s:guard_line] + lines[guard_line + 1 : e]
        # De-indent by the indentation of the first statement of the body;
        # lines with less indentation are left untouched.
        spaces_to_delete = c_block.body[0].col_offset
        indent = " " * spaces_to_delete
        fixed_lines = [
            n_line[spaces_to_delete:] if n_line.startswith(indent) else n_line
            for n_line in c_lines
        ]
        # `app.run(main)` becomes a direct `main()` call.
        filtered_lines = [
            re.sub(r"app\.run\((.*)\)$", r"\1()", line)
            for line in _strip_region_tags(fixed_lines)
        ]
        code_parts.append("\n".join(filtered_lines) + "\n")
    # Others
    else:
        print("Appending block...")
        # Every "DEFINE_" occurrence is lower-cased to "define_".
        filtered_lines = _strip_region_tags(
            [line.replace("DEFINE_", "define_") for line in lines[s:e]]
        )
        code_parts.append("\n".join(filtered_lines) + "\n")

FULL_TEXT = "".join(code_parts)
nbook["cells"].append(
    v4.new_code_cell(source=FULL_TEXT, id="code")
)

# Serialize the notebook to JSON and terminate it with a newline.
jsonform = f"{v4.writes(nbook)}\n"

print(f"writing {output_file}")
with open(output_file, "w", encoding="utf-8") as fpout:
    fpout.write(jsonform)
Add generate_all_notebook.sh 2020-03-04 13:46:06 +01:00			`#!/usr/bin/env python3`
Bump Copyright to 2025 2025-01-10 11:35:44 +01:00			`# Copyright 2010-2025 Google LLC`
Sync google3 github 2022-06-17 14:23:05 +02:00			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`

Sync g3 -> gh 2020-03-09 11:48:13 +01:00			`"""Transform any Python sample or example to Python NoteBook."""`
updating code to handle script conversion better the code basically leaves out the ``` if __name__=='__main__': ``` block and unwraps any function called main 2018-08-03 10:13:16 +02:00			`import ast`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`import os`
examples: Fix notebook generation (Fix #3244) 2022-04-13 14:32:40 +02:00			`import re`
sync from g3 2022-05-16 17:44:50 +02:00			`import sys`

Sync g3 -> gh 2020-03-09 11:48:13 +01:00			`from nbformat import v3`
			`from nbformat import v4`
py to ipynb 2017-11-20 17:04:25 +01:00
Sync g3 -> gh 2020-03-09 11:48:13 +01:00			`input_file = sys.argv[1]`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`print(f"reading {input_file}")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`with open(input_file, encoding="utf-8") as fpin:`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`text = fpin.read()`
py to ipynb 2017-11-20 17:04:25 +01:00
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`# Compute output file path.`
			`output_file = input_file`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`output_file = output_file.replace(".py", ".ipynb")`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`# For example/python/foo.py -> example/notebook/examples/foo.ipynb`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`output_file = output_file.replace("examples/python", "examples/notebook/examples")`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`# For example/contrib/foo.py -> example/notebook/contrib/foo.ipynb`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`output_file = output_file.replace("examples/contrib", "examples/notebook/contrib")`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`# For ortools//samples/foo.py -> example/notebook//foo.ipynb`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`output_file = output_file.replace("ortools", "examples/notebook")`
			`output_file = output_file.replace("samples/", "")`
tools: Update notebook script 2020-09-27 15:38:49 +02:00
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`nbook = v3.reads_py("")`
py to ipynb 2017-11-20 17:04:25 +01:00			`nbook = v4.upgrade(nbook) # Upgrade v3 to v4`

tools: update notebook script 2025-02-04 18:03:49 +01:00			`METADATA = {"language_info": {"name": "python"}}`
			`nbook["metadata"] = METADATA`

tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`print("Adding copyright cell...")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`GOOGLE = "##### Copyright 2025 Google LLC."`
			`nbook["cells"].append(v4.new_markdown_cell(source=GOOGLE, id="google"))`
tools: Update notebook script 2020-09-27 15:38:49 +02:00
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`print("Adding license cell...")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`APACHE = """Licensed under the Apache License, Version 2.0 (the "License");`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License.`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`"""`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`nbook["cells"].append(v4.new_markdown_cell(source=APACHE, id="apache"))`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00
			`print("Adding Title cell...")`
			`basename = "# " + os.path.basename(input_file).replace(".py", "")`
			`nbook["cells"].append(v4.new_markdown_cell(source=basename, id="basename"))`

			`print("Adding link cell...")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`GITHUB_LOGO = (`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`"https://raw.githubusercontent.com/google/or-tools/main/tools/github_32px.png"`
			`)`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`GITHUB_PATH = "https://github.com/google/or-tools/blob/main/" + input_file`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00
tools: update notebook script 2025-02-04 18:03:49 +01:00			`COLAB_PATH = (`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`"https://colab.research.google.com/github/google/or-tools/blob/main/" + output_file`
			`)`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`COLAB_LOGO = (`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`"https://raw.githubusercontent.com/google/or-tools/main/tools/colab_32px.png"`
			`)`
			`link = f"""<table align=\"left\">`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`<td>`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`<a href=\"{COLAB_PATH}\"><img src=\"{COLAB_LOGO}\"/>Run in Google Colab</a>`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`</td>`
			`<td>`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`<a href=\"{GITHUB_PATH}\"><img src=\"{GITHUB_LOGO}\"/>View source on GitHub</a>`
tools: Update notebook script 2020-09-27 15:38:49 +02:00			`</td>`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`</table>"""`
			`nbook["cells"].append(v4.new_markdown_cell(source=link, id="link"))`

			`print("Adding ortools install cell...")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`INSTALL_DOC = (`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`"First, you must install "`
			`"[ortools](https://pypi.org/project/ortools/) package in this "`
			`"colab."`
			`)`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`nbook["cells"].append(v4.new_markdown_cell(source=INSTALL_DOC, id="doc"))`
			`INSTALL_CMD = "%pip install ortools"`
			`nbook["cells"].append(v4.new_code_cell(source=INSTALL_CMD, id="install"))`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00
			`print("Adding code cell...")`
updating code to handle script conversion better the code basically leaves out the ``` if __name__=='__main__': ``` block and unwraps any function called main 2018-08-03 10:13:16 +02:00			`all_blocks = ast.parse(text).body`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`print(f"number of blocks: {len(all_blocks)}")`
Sync g3 -> gh 2020-03-09 11:48:13 +01:00			`line_start = [c.lineno - 1 for c in all_blocks]`
Update export_to_ipynb.py fixing script to handle xkcd.py as well 2018-08-03 10:26:25 +02:00			`line_start[0] = 0`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`lines = text.split("\n")`
updating code to handle script conversion better the code basically leaves out the ``` if __name__=='__main__': ``` block and unwraps any function called main 2018-08-03 10:13:16 +02:00
tools: update notebook script 2025-02-04 18:03:49 +01:00			`FULL_TEXT = ""`
examples: Fix notebook generation (Fix #3244) 2022-04-13 14:32:40 +02:00			`for idx, (c_block, s, e) in enumerate(`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`zip(all_blocks, line_start, line_start[1:] + [len(lines)])`
			`):`
			`print(f"block[{idx}]: {c_block}")`
			`c_text = "\n".join(lines[s:e])`
			`# Clean boilerplate header and description`
			`if (`
			`idx == 0`
			`and isinstance(c_block, ast.Expr)`
			`and isinstance(c_block.value, ast.Constant)`
			`):`
			`print("Adding description cell...")`
			`filtered_lines = lines[s:e]`
			`# filtered_lines = list(`
			`# filter(lambda l: not l.startswith('#!'), lines[s:e]))`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"^#!", l), filtered_lines)`
			`)`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[START .*\]$", l), filtered_lines)`
			`)`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[END .*\]$", l), filtered_lines)`
			`)`
			`# TODO(user): Remove only copyright not all line with '^#'`
			`filtered_lines = list(filter(lambda l: not l.startswith(r"#"), filtered_lines))`
			`filtered_lines = [s.replace(r'"""', "") for s in filtered_lines]`
			`filtered_text = "\n".join(filtered_lines)`
			`nbook["cells"].append(`
			`v4.new_markdown_cell(source=filtered_text, id="description")`
			`)`
			`# Remove absl app import`
			`elif (`
			`isinstance(c_block, ast.ImportFrom)`
			`and c_block.module == "absl"`
			`and c_block.names[0].name == "app"`
			`):`
			`print(f"Removing import {c_block.module}.{c_block.names[0].name}...")`
			`# rewrite absl flag import`
			`elif (`
			`isinstance(c_block, ast.ImportFrom)`
			`and c_block.module == "absl"`
			`and c_block.names[0].name == "flags"`
			`):`
			`print(f"Rewrite import {c_block.module}.{c_block.names[0].name}...")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`FULL_TEXT += "from ortools.sat.colab import flags\n"`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`# Unwrap __main__ function`
			`elif isinstance(c_block, ast.If) and c_block.test.comparators[0].s == "__main__":`
			`print("Unwrapping main function...")`
			`c_lines = lines[s + 1 : e]`
			`# remove start and de-indent lines`
			`spaces_to_delete = c_block.body[0].col_offset`
			`fixed_lines = [`
			`(`
			`n_line[spaces_to_delete:]`
			`if n_line.startswith(" " * spaces_to_delete)`
			`else n_line`
			`)`
			`for n_line in c_lines`
			`]`
			`filtered_lines = fixed_lines`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[START .*\]$", l), filtered_lines)`
			`)`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[END .*\]$", l), filtered_lines)`
			`)`
			`filtered_lines = [`
			`re.sub(r"app.run\((.*)\)$", r"\1()", s) for s in filtered_lines`
			`]`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`FULL_TEXT += "\n".join(filtered_lines) + "\n"`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`# Others`
			`else:`
			`print("Appending block...")`
			`filtered_lines = lines[s:e]`
			`for i, line in enumerate(filtered_lines):`
			`filtered_lines[i] = line.replace("DEFINE_", "define_")`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[START .*\]$", l), filtered_lines)`
			`)`
			`filtered_lines = list(`
			`filter(lambda l: not re.search(r"# \[END .*\]$", l), filtered_lines)`
			`)`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`FULL_TEXT += "\n".join(filtered_lines) + "\n"`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00
tools: update notebook script 2025-02-04 18:03:49 +01:00			`nbook["cells"].append(`
			`v4.new_code_cell(source=FULL_TEXT, id="code")`
			`)`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00
			`jsonform = v4.writes(nbook) + "\n"`

			`print(f"writing {output_file}")`
tools: update notebook script 2025-02-04 18:03:49 +01:00			`with open(output_file, mode="w", encoding="utf-8") as fpout:`
tools: format export_to_ipynb.py 2024-08-12 13:05:21 +02:00			`fpout.write(jsonform)`