', '>\n<title>', s) # Different Pandas versions produce different CSS styles. s = re.sub(r'<style[ a-z]*>.*</style>', '<style>...</style>', s, flags=re.DOTALL) # CalledProcessError message has a final dot in Python 3.6 s = re.sub(r"(' returned non-zero exit status \d+)\.", r'\1', s) for n, p in enumerate(ignores): s = re.sub(p, 'IGN{}'.format(n), s) return s def canonical_dict(dict, ignores): '''Neutralize gratuitous differences in a Jupyter dictionary. For instance, neutralize different Graphviz layouts in SVG. ''' if 'text' in dict: dict['text'] = canonicalize(dict['text'], 'text', ignores) if 'data' in dict: for k in dict['data']: dict['data'][k] = canonicalize(dict['data'][k], k, ignores) if ('ename' in dict and dict['ename'] == 'SystemExit' and dict['evalue'] == '77'): # sys.exit(77) is used to Skip the test. sys.exit(77) if 'transient' in dict: del dict['transient'] if 'execution_count' in dict: del dict['execution_count'] if 'traceback' in dict: del dict['traceback'] return dict def compare_outputs(ref, test, ignores=[]): '''Check that two lists of outputs are equivalent and report the result.''' # There can be several outputs. For instance wnen the cell both # prints a result (goes to "stdout") and displays an automaton # (goes to "data"). exp = pprint.pformat([canonical_dict(d, ignores) for d in ref], width=132) eff = pprint.pformat([canonical_dict(d, ignores) for d in test], width=132) if exp[:-1] != '\n': exp += '\n' if eff[:-1] != '\n': eff += '\n' if exp == eff: return True else: print(''.join(diff(exp.splitlines(1), eff.splitlines(1), fromfile='expected', tofile='effective'))) return False def _wait_for_ready_backport(kc): """Backport BlockingKernelClient.wait_for_ready from IPython 3""" # Wait for kernel info reply on shell channel kc.kernel_info() while True: msg = kc.get_shell_msg(block=True, timeout=30) if msg['msg_type'] == 'kernel_info_reply': break # Flush IOPub channel while True: try: msg = kc.get_iopub_msg(block=True, timeout=0.2) except Empty: break def run_cell(kc, cell): kc.execute(cell.source) # wait for finish, maximum 20s reply = kc.get_shell_msg(timeout=20) outs = [] while True: try: msg = kc.get_iopub_msg(timeout=0.2) except Empty: break msg_type = msg['msg_type'] content = msg['content'] if msg_type == 'status' and content['execution_state'] == 'idle': break if msg_type in ('status', 'pyin', 'execute_input', 'comm_open', 'comm_msg'): continue if msg_type == 'stream': if 'Widget' in content['text']: continue # If the last stream had the same name, then outputs are # appended. if outs: last = outs[-1] if last['output_type'] == 'stream' and \ last['name'] == content['name']: last['text'] += content['text'] continue elif msg_type == 'clear_output': outs = [] continue content['output_type'] = msg_type outs.append(content) return outs def test_notebook(ipynb): with open(ipynb, encoding='utf-8') as f: nb = nbformat.reads_json(f.read()) km = KernelManager() # Do not save the history to disk, as it can yield spurious lock errors. # See https://github.com/ipython/ipython/issues/2845 km.start_kernel(extra_arguments=['--HistoryManager.hist_file=:memory:']) kc = km.client() kc.start_channels() try: kc.wait_for_ready() except AttributeError: _wait_for_ready_backport(kc) successes = 0 failures = 0 errors = 0 for i, cell in enumerate(nb.cells): if cell.cell_type != 'code' or cell.source.startswith('%timeit'): continue try: outs = run_cell(kc, cell) except Exception as e: print("failed to run cell:", repr(e)) print(cell.input) errors += 1 continue failed = False if len(outs) != len(cell.outputs): print("output length mismatch (expected {}, got {})".format( len(cell.outputs), len(outs))) failed = True if not compare_outputs(outs, cell.outputs): failed = True print("cell %d: " % i, end="") if failed: print("FAIL") failures += 1 else: print("OK") successes += 1 print("tested notebook %s" % ipynb) print(" %3i cells successfully replicated" % successes) if failures: print(" %3i cells mismatched output" % failures) if errors: print(" %3i cells failed to complete" % errors) kc.stop_channels() km.shutdown_kernel() del km if failures | errors: sys.exit(1) if __name__ == '__main__': for ipynb in sys.argv[1:]: print("testing %s" % ipynb) test

#!/usr/bin/env python """ simple example script for running and testing notebooks. Usage: `ipnbdoctest.py foo.ipynb [bar.ipynb [...]]` Each cell is submitted to the kernel, and the outputs are compared with those stored in the notebook. """ # Derived from https://gist.github.com/minrk/2620735 from __future__ import print_function import os,sys,time import base64 import re import pprint from difflib import unified_diff as diff from collections import defaultdict try: from queue import Empty except ImportError: print('Python 3.x is needed to run this script.') sys.exit(77) import importlib.util try: importlib.util.find_spec('IPython') except: print('IPython is needed to run this script.') sys.exit(77) try: from jupyter_client import KernelManager except ImportError: try: from IPython.kernel import KernelManager except ImportError: try: from IPython.zmq.blockingkernelmanager \ import BlockingKernelManager as KernelManager except: print('IPython is needed to run this script.') sys.exit(77) # Until Debian Stable ships IPython >3.0, we stick to the v3 format. try: from nbformat import v4 as nbformat except ImportError: from IPython.nbformat import v4 as nbformat def compare_png(a64, b64): """compare two b64 PNGs (incomplete)""" try: import Image except ImportError: pass adata = base64.decodestring(a64) bdata = base64.decodestring(b64) return True def canonicalize(s, type, ignores): """sanitize a string for comparison. fix universal newlines, strip trailing newlines, and normalize likely random values (memory addresses and UUIDs) """ if not isinstance(s, str): return s # normalize newline: s = s.replace('\r\n', '\n') # ignore trailing newlines (but not space) s = s.rstrip('\n') # remove hex addresses: s = re.sub(r'at 0x[a-f0-9]+', 'object', s) # normalize UUIDs: s = re.sub(r'[a-f0-9]{8}(\-[a-f0-9]{4}){3}\-[a-f0-9]{12}', 'U-U-I-D', s) # normalize graphviz version s = re.sub(r'Generated by graphviz version.*', 'VERSION', s) # remove Spins verbose output version s = re.sub(r'SpinS Promela Compiler.*Compiled C .* to .*pml.spins', 'SpinS output', s, flags=re.DOTALL) # %%file writes `Writing`, or `Overwriting` if the file exists. s = re.sub(r'^Overwriting ', 'Writing ', s) # SVG generated by graphviz may put note at different positions # depending on the graphviz build. Let's just strip anything that # look like a position. s = re.sub(r'', '>\n<title>', s) # Different Pandas versions produce different CSS styles. s = re.sub(r'<style[ a-z]*>.*</style>', '<style>...</style>', s, flags=re.DOTALL) # CalledProcessError message has a final dot in Python 3.6 s = re.sub(r"(' returned non-zero exit status \d+)\.", r'\1', s) for n, p in enumerate(ignores): s = re.sub(p, 'IGN{}'.format(n), s) return s def canonical_dict(dict, ignores): '''Neutralize gratuitous differences in a Jupyter dictionary. For instance, neutralize different Graphviz layouts in SVG. ''' if 'text' in dict: dict['text'] = canonicalize(dict['text'], 'text', ignores) if 'data' in dict: for k in dict['data']: dict['data'][k] = canonicalize(dict['data'][k], k, ignores) if ('ename' in dict and dict['ename'] == 'SystemExit' and dict['evalue'] == '77'): # sys.exit(77) is used to Skip the test. sys.exit(77) if 'transient' in dict: del dict['transient'] if 'execution_count' in dict: del dict['execution_count'] if 'traceback' in dict: del dict['traceback'] return dict def compare_outputs(ref, test, ignores=[]): '''Check that two lists of outputs are equivalent and report the result.''' # There can be several outputs. For instance wnen the cell both # prints a result (goes to "stdout") and displays an automaton # (goes to "data"). exp = pprint.pformat([canonical_dict(d, ignores) for d in ref], width=132) eff = pprint.pformat([canonical_dict(d, ignores) for d in test], width=132) if exp[:-1] != '\n': exp += '\n' if eff[:-1] != '\n': eff += '\n' if exp == eff: return True else: print(''.join(diff(exp.splitlines(1), eff.splitlines(1), fromfile='expected', tofile='effective'))) return False def _wait_for_ready_backport(kc): """Backport BlockingKernelClient.wait_for_ready from IPython 3""" # Wait for kernel info reply on shell channel kc.kernel_info() while True: msg = kc.get_shell_msg(block=True, timeout=30) if msg['msg_type'] == 'kernel_info_reply': break # Flush IOPub channel while True: try: msg = kc.get_iopub_msg(block=True, timeout=0.2) except Empty: break def run_cell(kc, cell): kc.execute(cell.source) # wait for finish, maximum 20s reply = kc.get_shell_msg(timeout=20) outs = [] while True: try: msg = kc.get_iopub_msg(timeout=0.2) except Empty: break msg_type = msg['msg_type'] content = msg['content'] if msg_type == 'status' and content['execution_state'] == 'idle': break if msg_type in ('status', 'pyin', 'execute_input', 'comm_open', 'comm_msg'): continue if msg_type == 'stream': if 'Widget' in content['text']: continue # If the last stream had the same name, then outputs are # appended. if outs: last = outs[-1] if last['output_type'] == 'stream' and \ last['name'] == content['name']: last['text'] += content['text'] continue elif msg_type == 'clear_output': outs = [] continue content['output_type'] = msg_type outs.append(content) return outs def test_notebook(ipynb): with open(ipynb, encoding='utf-8') as f: nb = nbformat.reads_json(f.read()) km = KernelManager() # Do not save the history to disk, as it can yield spurious lock errors. # See https://github.com/ipython/ipython/issues/2845 km.start_kernel(extra_arguments=['--HistoryManager.hist_file=:memory:']) kc = km.client() kc.start_channels() try: kc.wait_for_ready() except AttributeError: _wait_for_ready_backport(kc) successes = 0 failures = 0 errors = 0 for i, cell in enumerate(nb.cells): if cell.cell_type != 'code' or cell.source.startswith('%timeit'): continue try: outs = run_cell(kc, cell) except Exception as e: print("failed to run cell:", repr(e)) print(cell.input) errors += 1 continue failed = False if len(outs) != len(cell.outputs): print("output length mismatch (expected {}, got {})".format( len(cell.outputs), len(outs))) failed = True if not compare_outputs(outs, cell.outputs): failed = True print("cell %d: " % i, end="") if failed: print("FAIL") failures += 1 else: print("OK") successes += 1 print("tested notebook %s" % ipynb) print(" %3i cells successfully replicated" % successes) if failures: print(" %3i cells mismatched output" % failures) if errors: print(" %3i cells failed to complete" % errors) kc.stop_channels() km.shutdown_kernel() del km if failures | errors: sys.exit(1) if __name__ == '__main__': for ipynb in sys.argv[1:]: print("testing %s" % ipynb) test_notebook(ipynb)