forked from rasbt/python-machine-learning-book-3rd-edition
-
Notifications
You must be signed in to change notification settings - Fork 65
/
.convert_notebook_to_script.py
78 lines (59 loc) · 2.26 KB
/
.convert_notebook_to_script.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
# Simple helper script to convert
# a Jupyter notebook to Python
#
# Sebastian Raschka, 2017
import argparse
import os
import subprocess
def convert(input_path, output_path):
subprocess.call(['jupyter', 'nbconvert', '--to', 'script',
input_path, '--output', output_path])
def cleanup(path):
skip_lines_startwith = ('Image(filename=',
'# In[',
'# <hr>',
'from IPython.display import Image',
'get_ipython()',
'# <br>')
clean_content = []
imports = []
existing_imports = set()
with open(path, 'r') as f:
next(f)
next(f)
for line in f:
line = line.rstrip(' ')
if line.startswith(skip_lines_startwith):
continue
if line.startswith('import ') or (
'from ' in line and 'import ' in line):
if 'from __future__ import print_function' in line:
if line != imports[0]:
imports.insert(0, line)
else:
if line.strip() not in existing_imports:
imports.append(line)
existing_imports.add(line.strip())
else:
clean_content.append(line)
clean_content = ['# coding: utf-8\n\n\n'] + imports + clean_content
with open(path, 'w') as f:
for line in clean_content:
f.write(line)
if __name__ == '__main__':
parser = argparse.ArgumentParser(
description='Convert Jupyter notebook to Python script.',
formatter_class=argparse.RawTextHelpFormatter)
parser.add_argument('-i', '--input',
required=True,
help='Path to the Jupyter Notebook file')
parser.add_argument('-o', '--output',
required=True,
help='Path to the Python script file')
parser.add_argument('-v', '--version',
action='version',
version='v. 0.1')
args = parser.parse_args()
convert(input_path=args.input,
output_path=os.path.splitext(args.output)[0])
cleanup(args.output)