doc/hackathon/converttonotebook_8py_source.html

#!/usr/bin/env python

# Author: Pau Miquel i Mir <pau.miquel.mir@cern.ch> <pmm1g15@soton.ac.uk>>

# Date: July, 2016

#

# DISCLAIMER: This script is a prototype and a work in progress. Indeed, it is possible that

# it may not work for certain tutorials, and that it, or the tutorial, might need to be

# tweaked slightly to ensure full functionality. Please do not hesitate to email the author

# with any questions or with examples that do not work.

#

# HELP IT DOESN'T WORK: Two possible solutions:

#     1. If the tutorial takes a long time to execute (more than 90 seconds), add the name of the

#        tutorial to the list of long tutorials listLongTutorials, in the function findTimeout.

#     2. Check that helper functions are recognised correctly in split(text).

#

# REQUIREMENTS: This script needs jupyter to be properly installed, as it uses the python

# package nbformat and calls the shell commands `jupyter nbconvert` and `jupyter trust`. The

# rest of the packages used should be included in a standard installation of python. The script

# is intended to be run on a UNIX based system.

#

#

# FUNCTIONING:

# -----------

# The converttonotebook script creates Jupyter notebooks from raw C++ or python files.

# Particularly, it is indicated to convert the ROOT tutorials found in the ROOT

# repository.

#

# The script should be called from bash with the following format:

#      python /path/to/script/converttonotebook.py /path/to/<macro>.C /path/to/outdir

#

# Indeed the script takes two arguments, the path to the macro and the path to the directory

# where the notebooks will be created

#

# The script's general functioning is as follows. The macro to be converted is imported as a string.

# A series of modifications are made to this string, for instance delimiting where markdown and

# code cells begin and end. Then, this string is converted into ipynb format using a function

# in the nbconvert package. Finally, the notebook is executed and output.

#

# For converting python tutorials it is fairly straightforward. It extracts the description and

# author information from the header and then removes it. It also converts any comment at the

# beginning of a line into a Markdown cell.

#

# For C++ files the process is slightly more complex. The script separates the functions from the

# main code. The main function is identified as it has the same name as the macro file. The other

# functions are considered functions. The main function is "extracted" and presented as main code.

# The helper functions are placed in their own code cell with the %%cpp -d magic to enable function

# defintion. Finally, as with Python macros, relevant information is extracted from the header, and

# newline comments are converted into Markdown cells (unless they are in helper functions).

#

# The script creates an .ipynb version of the macro,  with the full output included.

# The files are named:

#     <macro>.<C or py>.nbconvert.ipynb

#

# It is called by filter.cxx, which in turn is called by doxygen when processing any file

# in the ROOT repository. filter.cxx only calls convertonotebook.py when the string \notebook

# is found in the header of the tutorial, but this script checks for its presence as well.


import re

import os

import sys

import json

import time

import doctest

import textwrap

import subprocess

from nbformat import v3, v4

from datetime import datetime, date

import statistics


# -------------------------------------

# -------- Function definitions--------

# -------------------------------------


def unindenter(string, spaces = 3):

    """

    Returns string with each line unindented by 3 spaces. If line isn't indented, it stays the same.

    >>> unindenter("   foobar")

    'foobar\\n'

    >>> unindenter("foobar")

    'foobar\\n'

    >>> unindenter('''foobar

    ...    foobar

    ... foobar''')

    'foobar\\nfoobar\\nfoobar\\n'

    """

    newstring = ''

    lines = string.splitlines()

    for line in lines:

        if line.startswith(spaces*' '):

            newstring += (line[spaces:] + "\n")

        else:

            newstring += (line + "\n")


    return newstring


def measureIndentation(text):

    """Measure the indentation width"""

    nSpaces = sorted({len(line) - len(line.lstrip()) for line in text.splitlines() if line.strip()})

    return nSpaces[0] if nSpaces[0] != 0 or len(nSpaces) == 1 else nSpaces[1]


def readHeaderPython(text):

    """

    Extract author and description from header, eliminate header from text. Also returns

    notebook boolean, which is True if the string \notebook is present in the header

    Also determine options (-js, -nodraw, -header) passed in \notebook command, and

    return their booleans

    >>> readHeaderPython('''## \\file

    ... ## \\ingroup tutorials

    ... ## \\\\notebook

    ... ## This is the description of the tutorial

    ... ##

    ... ## \\macro_image

    ... ## \\macro_code

    ... ##

    ... ## \\\\author John Brown

    ... def tutorialfuncion()''')

    ('def tutorialfuncion()\\n', 'This is the description of the tutorial\\n\\n\\n', 'John Brown', True, False, False, False)

    >>> readHeaderPython('''## \\file

    ... ## \\ingroup tutorials

    ... ## \\\\notebook -js

    ... ## This is the description of the tutorial

    ... ##

    ... ## \\macro_image

    ... ## \\macro_code

    ... ##

    ... ## \\\\author John Brown

    ... def tutorialfuncion()''')

    ('def tutorialfuncion()\\n', 'This is the description of the tutorial\\n\\n\\n', 'John Brown', True, True, False, False)

    >>> readHeaderPython('''## \\file

    ... ## \\ingroup tutorials

    ... ## \\\\notebook -nodraw

    ... ## This is the description of the tutorial

    ... ##

    ... ## \\macro_image

    ... ## \\macro_code

    ... ##

    ... ## \\\\author John Brown

    ... def tutorialfuncion()''')

    ('def tutorialfuncion()\\n', 'This is the description of the tutorial\\n\\n\\n', 'John Brown', True, False, True, False)

    """

    lines = text.splitlines()


    description = ''

    author = ''

    isNotebook = False

    isJsroot = False

    nodraw = False

    needsHeaderFile = False

    for i, line in enumerate(lines):

        if line.startswith("## \\aut"):

            author = line[11:]

        elif line.startswith("## \\note"):

            isNotebook = True

            if "-js" in line:

                isJsroot = True

            if "-nodraw" in line:

                nodraw = True

            if "-header" in line:

                needsHeaderFile = True

        elif line.startswith("##"):

            if not line.startswith("## \\") and isNotebook:

                description += (line[3:] + '\n')

        else:

            break

    newtext = ''

    for line in lines[i:]:

        newtext += (line + "\n")


    return newtext, description, author, isNotebook, isJsroot, nodraw, needsHeaderFile


def pythonComments(text):

    """

    Converts comments delimited by # or ## and on a new line into a markdown cell.

    For python files only

    >>> pythonComments('''## This is a

    ... ## multiline comment

    ... def function()''')

    '# <markdowncell>\\n## This is a\\n## multiline comment\\n# <codecell>\\ndef function()\\n'

    >>> pythonComments('''def function():

    ...     variable = 5 # Comment not in cell

    ...     # Comment also not in cell''')

    'def function():\\n    variable = 5 # Comment not in cell\\n    # Comment also not in cell\\n'

    """

    text = text.splitlines()

    newtext = ''

    inComment = False

    for i, line in enumerate(text):

        if line.startswith("#") and not inComment:  # True if first line of comment

            inComment = True

            newtext += "# <markdowncell>\n"

            newtext += (line + "\n")

        elif inComment and not line.startswith("#"):  # True if first line after comment

            inComment = False

            newtext += "# <codecell>\n"

            newtext += (line+"\n")

        else:

            newtext += (line+"\n")

    return newtext


def pythonMainFunction(text):

    lines = text.splitlines()

    functionContentRe = re.compile('def %s\\(.*\\):' % tutName , flags = re.DOTALL | re.MULTILINE)

    newtext = ''

    inMainFunction = False

    hasMainFunction = False

    for line in lines:


        if hasMainFunction:

            if line.startswith("""if __name__ == "__main__":""") or line.startswith("""if __name__ == '__main__':"""):

                break

        match = functionContentRe.search(line)

        if inMainFunction and not line.startswith("    ") and line != "":

            inMainFunction = False

        if match:

            inMainFunction = True

            hasMainFunction = True

        else:

            if inMainFunction:

                newtext += (line[4:] + '\n')

            else:

                newtext += (line + '\n')

    return newtext


def convertDoxygenLatexToMarkdown(text):

    """Replace formula tags used by doxygen to the ones used in notebooks."""

    text = text.replace("\\f$", "$")

    text = text.replace("\\f[", "$$")

    text = text.replace("\\f]", "$$")

    return text


def readHeaderCpp(text):

    """

    Extract author and description from header, eliminate header from text. Also returns

    notebook boolean, which is True if the string \notebook is present in the header

    Also determine options (-js, -nodraw, -header) passed in \notebook command, and

    return their booleans

    >>> readHeaderCpp('''/// \\file

    ... /// \\ingroup tutorials

    ... /// \\\\notebook

    ... /// This is the description of the tutorial

    ... ///

    ... /// \\macro_image

    ... /// \\macro_code

    ... ///

    ... /// \\\\author John Brown

    ... void tutorialfuncion(){}''')

    ('void tutorialfuncion(){}\\n', '# This is the description of the tutorial\\n# \\n# \\n', 'John Brown', True, False, False, False)

    >>> readHeaderCpp('''/// \\file

    ... /// \\ingroup tutorials

    ... /// \\\\notebook -js

    ... /// This is the description of the tutorial

    ... ///

    ... /// \\macro_image

    ... /// \\macro_code

    ... ///

    ... /// \\\\author John Brown

    ... void tutorialfuncion(){}''')

    ('void tutorialfuncion(){}\\n', '# This is the description of the tutorial\\n# \\n# \\n', 'John Brown', True, True, False, False)

    >>> readHeaderCpp('''/// \\file

    ... /// \\ingroup tutorials

    ... /// \\\\notebook -nodraw

    ... /// This is the description of the tutorial

    ... ///

    ... /// \\macro_image

    ... /// \\macro_code

    ... ///

    ... /// \\\\author John Brown

    ... void tutorialfuncion(){}''')

    ('void tutorialfuncion(){}\\n', '# This is the description of the tutorial\\n# \\n# \\n', 'John Brown', True, False, True, False)

    """

    lines = text.splitlines()


    description = ''

    author = ''

    isNotebook = False

    isJsroot = False

    nodraw = False

    needsHeaderFile = False

    for i, line in enumerate(lines):

        if line.startswith("/// \\aut"):

            author = line[12:]

        if line.startswith("/// \\note"):

            isNotebook = True

            if "-js" in line:

                isJsroot = True

            if "-nodraw" in line:

                nodraw = True

            if "-header" in line:

                needsHeaderFile = True

        if line.startswith("///"):

            if not line.startswith("/// \\") and isNotebook:

                description += ('# ' + line[4:] + '\n')

        else:

            break

    newtext = ''

    for line in lines[i:]:

        newtext += (line + "\n")

    description = convertDoxygenLatexToMarkdown(description)

    return newtext, description, author, isNotebook, isJsroot, nodraw, needsHeaderFile


def cppFunction(text):

    """

    Extracts main function for the function enclosure by means of regular expression

    >>> cppFunction('''void mainfunction(arguments = values){

    ...    content of function

    ...    which spans

    ...    several lines

    ... }''')

    '\\n   content of function\\n   which spans\\n   several lines\\n'

    >>> cppFunction('''void mainfunction(arguments = values)

    ... {

    ...    content of function

    ...    which spans

    ...    several lines

    ... }''')

    '\\n   content of function\\n   which spans\\n   several lines\\n'

    >>> cppFunction('''void mainfunction(arguments = values

    ... morearguments = morevalues)

    ... {

    ...    content of function

    ...    which spans

    ...    several lines

    ... }''')

    '\\n   content of function\\n   which spans\\n   several lines\\n'

    """

    functionContentRe = re.compile(r'(?<=\{).*(?=^\})', flags = re.DOTALL | re.MULTILINE)


    match = functionContentRe.search(text)


    if match:

        return match.group()

    else:

        return text


def cppComments(text):

    """

    Converts comments delimited by // and on a new line into a markdown cell. Skips comments inside

    blocks and braces, though, since these would otherwise be ripped apart. For C++ files only.

    >>> cppComments('''// This is a

    ... // multiline comment

    ... void function(){}''')

    '# <markdowncell>\\n# This is a\\n#  multiline comment\\n# <codecell>\\nvoid function(){}\\n'

    >>> cppComments('''void function(){

    ...    int variable = 5 // Comment not in cell

    ...    // Comment also not in cell

    ... }''')

    'void function(){\\n   int variable = 5 // Comment not in cell\\n   // Comment also not in cell\\n}\\n'

    """

    newtext = ''

    inComment = False

    curlyDepth = 0

    braceDepth = 0


    for line in text.splitlines():


        if line.strip().startswith("//") and curlyDepth == 0 and braceDepth == 0:

            line = line.strip(" /")


            # Allow for doxygen-style latex:

            line = convertDoxygenLatexToMarkdown(line)


            if not inComment:  # True if first line of comment

                inComment = True

                newtext += "# <markdowncell>\n\n"

            newtext += ("# " + line + "\n")

        else:

            for char in line:

                if char == "(":

                    braceDepth += 1

                elif char == ")":

                    braceDepth -= 1

                elif char == "{":

                    curlyDepth += 1

                elif char == "}":

                    curlyDepth -= 1


            if inComment:  # True if first line after comment

                inComment = False

                newtext += "# <codecell>\n"


            newtext += (line+"\n")


    return newtext


def findBracedBlock(text, startpos, openingBraceChar):

    """

    Scan the string in <text>, starting at <startpos>. Return index of opening and

    matching closing brace if present. The brace to search for is passed in <openingBraceChar>,

    e.g. '(', '{', '['.

    """

    depth = 0

    braceRegex = {"<": r"[<>]", "(": r"[()]", "{": r"[{}]", "[": r"[[]]"}

    if openingBraceChar not in braceRegex:

        raise ValueError("Brace character " + openingBraceChar + " doesn't seem to be an opening brace")


    begin = None

    bracketRe = re.compile(braceRegex[openingBraceChar], flags = re.DOTALL | re.MULTILINE)


    while True:

        lastMatch = bracketRe.search(text, startpos)

        if lastMatch:

            if begin is None:

                if lastMatch.group() != openingBraceChar:

                    raise ValueError("Found " + lastMatch.group() + " while looking for opening brace in\n" + text[pos:])

                begin = lastMatch.start()


            depth += 1 if lastMatch.group(0) == openingBraceChar else -1

            startpos = lastMatch.end()


            if depth == 0:

                ret = (begin,lastMatch.end()-1)

                begin = None

                yield ret

        elif depth == 0:

            return

        else:

            raise ValueError("Unmatched " + braceRegex[openingBraceChar] + " at " + text[startpos-15:startpos+15])


def findStuffBeforeFunc(text, searchStart, searchEnd):

    beforeFunctionRe = re.compile("(;|}|//[^\n]*)\s*$", flags = re.MULTILINE)

    try:

        # Find the last '}' or comment line etc before function definition:

        lastMatchBeforeFunc = [thisMatch for thisMatch in beforeFunctionRe.finditer(text, searchStart, searchEnd)][-1]

        return lastMatchBeforeFunc.end()+1

    except IndexError as e:

        return searchStart


def split(text):

    """

    Splits the text string into main, helpers, and rest. main is the main function,

    i.e. the function with the same name as the macro file. Helpers is a list of

    strings, each a helper function, i.e. any other function that is not the main function.

    Finally, rest is a string containing any top-level code/declarations outside of any function.

    Comments above a function will be converted to a markdown cell in notebooks.

    Intended for C++ files only.

    >>> split('''void tutorial(){

    ...    content of tutorial

    ... }''')

    ('void tutorial(){\\n   content of tutorial\\n}', [], '')

    >>> split('''void tutorial(){

    ...    content of tutorial

    ... }

    ... void helper(arguments = values){

    ...    helper function

    ...    content spans lines

    ... }''')

    ('void tutorial(){\\n   content of tutorial\\n}', ['\\n# <markdowncell>\\n A helper function is created: \\n# <codecell>\\n%%cpp -d\\nvoid helper(arguments = values){\\n   helper function\\n   content spans lines\\n}'], '')

    >>> split('''#include <header.h>

    ... using namespace NAMESPACE

    ... void tutorial(){

    ...    content of tutorial

    ... }

    ... void helper(arguments = values){

    ...    helper function

    ...    content spans lines

    ... }''')

    ('void tutorial(){\\n   content of tutorial\\n}', ['\\n# <markdowncell>\\n A helper function is created: \\n# <codecell>\\n%%cpp -d\\nvoid helper(arguments = values){\\n   helper function\\n   content spans lines\\n}'], '#include <header.h>\\nusing namespace NAMESPACE')

    >>> split('''void tutorial(){

    ...    content of tutorial

    ... }

    ... // This is a multiline

    ... // description of the

    ... // helper function

    ... void helper(arguments = values){

    ...    helper function

    ...    content spans lines

    ... }''')

    ('void tutorial(){\\n   content of tutorial\\n}', ['\\n# <markdowncell>\\n  This is a multiline\\n description of the\\n helper function\\n \\n# <codecell>\\n%%cpp -d\\nvoid helper(arguments = values){\\n   helper function\\n   content spans lines\\n}'], '')

    """

    functionRe = re.compile(r"[^(/;]*?\s+[*&]*([\w:]+)\s*\‍(", flags = re.DOTALL | re.MULTILINE)

    tailRe = re.compile(r"}\s*;?", flags = re.DOTALL | re.MULTILINE)

    helpers = []

    definitions = []

    main = ""

    searchStart = 0

    for curlyBegin,curlyEnd in findBracedBlock(text, 0, "{"):

        functionMatches = [match for match in functionRe.finditer(text, searchStart, curlyBegin)]


        tailMatch = tailRe.match(text, curlyEnd)

        if tailMatch:

            curlyEnd = tailMatch.end()

        else:

            sys.stderr.write("Failed match on " + text[curlyEnd:curlyEnd+10])


        if not functionMatches:

            definitions.append("%%cpp -d\n" + text[searchStart:curlyEnd])

            searchStart = curlyEnd+1

            continue


        functionMatch = functionMatches[-1]

        startpos = functionMatch.start()

        # Search for function arguments

        roundBegin,roundEnd = next( findBracedBlock(text, functionMatch.end()-2, "(") )

        if roundEnd > curlyBegin:

            raise RuntimeError("Didn't find '()' before '{}'")


        beforeFuncPos = findStuffBeforeFunc(text, searchStart, functionMatch.start(1))

        stuffBeforeFunc = text[searchStart:beforeFuncPos]

        funcString = text[beforeFuncPos:curlyEnd]

        searchStart = curlyEnd


        commentLines = []

        for line in stuffBeforeFunc.splitlines():

            if line.strip().startswith("//"):

                commentLines.append(line)

            else:

                definitions.append(line)


        if tutName == functionMatch.group(1).strip():  # if the name of the function is that of the macro

            main = funcString

        else:

            helpers.append((funcString, functionMatch.group(1).strip(), commentLines))


    newHelpers = []

    for helper,functionName,commentLines in helpers:      # For each helper function

        helper = helper.rstrip(" \n")

        helperDescription = ""

        for line in commentLines:

            helper = helper.replace(line, "")

            if line.strip() in ["//", "///"]:

                # Convert empty comment lines to markdown breaks

                helperDescription += "\n\n"

            else:

                helperDescription += line.strip(" /*") + "\n"

        if len(helperDescription) == 0:   # If no comments are found create generic description

            helperDescription = "Definition of a helper function:"


        if functionName != "main":  # remove void main function

            newHelpers.append("\n# <markdowncell>\n " + helperDescription + " \n# <codecell>\n%%cpp -d\n" + helper)


    return main, newHelpers, "\n".join(definitions)


def processmain(text):

    """

    Evaluates whether the main function returns a TCanvas or requires input. If it

    does then the keepfunction flag is True, meaning the function wont be extracted

    by cppFunction. If the initial condition is true then an extra cell is added

    before at the end that calls the main function is returned, and added later.

    >>> processmain('''void function(){

    ...    content of function

    ...    spanning several

    ...    lines

    ... }''')

    ('void function(){\\n   content of function\\n   spanning several\\n   lines\\n}', '')

    >>> processmain('''void function(arguments = values){

    ...    content of function

    ...    spanning several

    ...    lines

    ... }''')

    ('void function(arguments = values){\\n   content of function\\n   spanning several\\n   lines\\n}', '# <markdowncell> \\n Arguments are defined. \\n# <codecell>\\narguments = values;\\n# <codecell>\\n')

    >>> processmain('''void function(argument1 = value1, //comment 1

    ...                              argument2 = value2 /*comment 2*/ ,

    ...                              argument3 = value3,

    ...                              argument4 = value4)

    ... {

    ...    content of function

    ...    spanning several

    ...    lines

    ... }''')

    ('void function(argument1 = value1, //comment 1\\n                             argument2 = value2 /*comment 2*/ ,\\n                             argument3 = value3, \\n                             argument4 = value4)\\n{\\n   content of function\\n   spanning several\\n   lines\\n}', '# <markdowncell> \\n Arguments are defined. \\n# <codecell>\\nargument1 = value1;\\nargument2 = value2;\\nargument3 = value3;\\nargument4 = value4;\\n# <codecell>\\n')

    >>> processmain('''TCanvas function(){

    ...    content of function

    ...    spanning several

    ...    lines

    ...    return c1

    ... }''')

    ('TCanvas function(){\\n   content of function\\n   spanning several \\n   lines\\n   return c1\\n}', '')

    """


    argumentsCell = ''


    if text:

        argumentsre = re.compile(r'(?<=\‍().*?(?=\‍))', flags = re.DOTALL | re.MULTILINE)

        arguments = argumentsre.search(text)


        if len(arguments.group()) > 3:

            argumentsCell = "# <markdowncell> \n Arguments are defined. \n# <codecell>\n"

            individualArgumentre = re.compile(r'[^/\n,]*?=[^/\n,]*') #, flags = re.DOTALL) #| re.MULTILINE)

            argumentList=individualArgumentre.findall(arguments.group())

            for argument in argumentList:

                argumentsCell += argument.strip("\n ") + ";\n"

            argumentsCell += "# <codecell>\n"


    return text, argumentsCell


# now define text transformers


def removePaletteEditor(code):

    code = code.replace("img->StartPaletteEditor();", "")

    code = code.replace("Open the color editor", "")

    return code


def runEventExe(code):

    if "copytree" in tutName:

        return "# <codecell> \n.! $ROOTSYS/test/eventexe 1000 1 1 1 \n" + code

    return code


def getLibMathMore(code):

    if "quasirandom" == tutName:

        return "# <codecell> \ngSystem->Load(\"libMathMore\"); \n# <codecell> \n" + code

    return code


def roofitRemoveSpacesComments(code):


    def changeString(matchObject):

        matchString = matchObject.group()

        matchString = matchString[0]  + " " + matchString[1:]

        matchString = matchString.replace("  " , "THISISASPACE")

        matchString = matchString.replace(" " , "")

        matchString = matchString.replace("THISISASPACE" , " ")

        return matchString


    newcode = re.sub("#\s\s?\w\s[\w-]\s\w.*", changeString , code)

    return newcode


def declareNamespace(code):

    if "using namespace RooFit;\nusing namespace RooStats;" in code:

        code = code.replace("using namespace RooFit;\nusing namespace RooStats;", "# <codecell>\n%%cpp -d\n// This is a workaround to make sure the namespace is used inside functions\nusing namespace RooFit;\nusing namespace RooStats;\n# <codecell>\n")


    else:

        code = code.replace("using namespace RooFit;", "# <codecell>\n%%cpp -d\n// This is a workaround to make sure the namespace is used inside functions\nusing namespace RooFit;\n# <codecell>\n")

        code = code.replace("using namespace RooStats;", "# <codecell>\n%%cpp -d\n// This is a workaround to make sure the namespace is used inside functions\nusing namespace RooStats;\n# <codecell>\n")

        code = code.replace("using namespace ROOT::Math;", "# <codecell>\n%%cpp -d\n// This is a workaround to make sure the namespace is used inside functions\nusing namespace ROOT::Math;\n# <codecell>\n")


    return code


def rs401dGetFiles(code):

    if tutName == "rs401d_FeldmanCousins":

        code = code.replace(

         """#include "../tutorials/roofit/roostats/NuMuToNuE_Oscillation.h"\n#include "../tutorials/roofit/roostats/NuMuToNuE_Oscillation.cxx" // so that it can be executed directly\n#else\n#include "../tutorials/roofit/roostats/NuMuToNuE_Oscillation.cxx+" // so that it can be executed directly\n""" , """TString tutDir = gROOT->GetTutorialDir();\nTString headerDir = TString::Format("#include \\\"%s/roostats/NuMuToNuE_Oscillation.h\\\"", tutDir.Data());\nTString impDir = TString::Format("#include \\\"%s/roostats/NuMuToNuE_Oscillation.cxx\\\"", tutDir.Data());\ngROOT->ProcessLine(headerDir);\ngROOT->ProcessLine(impDir);""")

    return code


def declareIncludes(code):

    if tutName != "fitcont":

        code = re.sub(r"# <codecell>\s*#include", "# <codecell>\n%%cpp -d\n#include" , code)

    return code


def tree4GetFiles(code):

    if tutName == "tree4":

        code = code.replace(

         """#include \"../test/Event.h\"""" , """# <codecell>\nTString dir = "$ROOTSYS/test/Event.h";\ngSystem->ExpandPathName(dir);\nTString includeCommand = TString::Format("#include \\\"%s\\\"" , dir.Data());\ngROOT->ProcessLine(includeCommand);""")

    return code


def disableDrawProgressBar(code):

    code = code.replace(":DrawProgressBar",":!DrawProgressBar")

    return code


def fixes(code):

    codeTransformers=[removePaletteEditor, runEventExe, getLibMathMore,

        roofitRemoveSpacesComments,

        #declareNamespace,

        rs401dGetFiles,

        declareIncludes, tree4GetFiles, disableDrawProgressBar]


    for transformer in codeTransformers:

        code = transformer(code)


    return code


def changeMarkdown(code):

    code = code.replace("~~~" , "```")

    code = code.replace("{.cpp}", "cpp")

    code = code.replace("{.bash}", "bash")

    return code


def isCpp():

    """

    Return True if extension is a C++ file

    """

    return extension in ("C", "c", "cpp", "C++", "cxx")


def findTimeout():

   if tutName in ["OneSidedFrequentistUpperLimitWithBands",

       "StandardBayesianNumericalDemo",

       "TwoSidedFrequentistUpperLimitWithBands",

       "HybridStandardForm",

       "rs401d_FeldmanCousins",

       "TMVAMultipleBackgroundExample",

       "TMVARegression",

       "TMVAClassification",

       "StandardHypoTestDemo"]:

      return 900

   elif tutName in ["df103_NanoAODHiggsAnalysis"]:

      return 1200

   else:

      return 120


# -------------------------------------

# ------------ Main Program------------

# -------------------------------------


def mainfunction(text):

    """

    Main function. Calls all other functions, depending on whether the macro input is in python or c++.

    It adds the header information. Also, it adds a cell that draws all canvases. The working text is

    then converted to a version 3 jupyter notebook, subsequently updated to a version 4. Then, metadata

    associated with the language the macro is written in is attatched to he notebook. Finally the

    notebook is executed and output as a Jupyter notebook.

    """

    # Modify text from macros to suit a notebook

    if isCpp():

        try:

            main, helpers, rest = split(text)

            main,  argumentsCell = processmain(main)

            funcText = cppFunction(main)

            main = cppComments(unindenter(funcText, measureIndentation(funcText)))  # Remove function, Unindent, and convert comments to Markdown cells


            if argumentsCell:

                main = argumentsCell + main


            rest = cppComments(rest)  # Convert top level code comments to Markdown cells


            # Construct text by starting with top level code, then the helper functions, and finally the main function.

            # Also add cells for headerfile, or keepfunction

            if needsHeaderFile:

                text = "# <markdowncell>\n# The header file must be copied to the current directory\n# <codecell>\n.!cp %s%s.h .\n# <codecell>\n" % (tutRelativePath, tutName)

                text += rest

            else:

                text = "# <codecell>\n" + rest


            for helper in helpers:

                text += helper


            text += ("\n# <codecell>\n" + main)

        except Exception as e:

            sys.stderr.write("Failed to convert C++ to notebook\n" + str(e))

            raise e


    if extension == "py":

        text = pythonMainFunction(text)

        text = pythonComments(text)  # Convert comments into Markdown cells


    # Perform last minute fixes to the notebook, used for specific fixes needed by some tutorials

    text = fixes(text)


    # Change to standard Markdown

    newDescription = changeMarkdown(description)


    # Add the title and header of the notebook

    text = "# <markdowncell> \n# # %s\n%s# \n# \n# **Author:** %s  \n# <i><small>This notebook tutorial was automatically generated " \

        "with <a href= \"https://github.com/root-project/root/blob/master/documentation/doxygen/converttonotebook.py\">ROOTBOOK-izer</a> " \

        "from the macro found in the ROOT repository  on %s.</small></i>\n# <codecell>\n%s" % (tutTitle, newDescription, author, date, text)


    # Add cell at the end of the notebook that draws all the canvasses. Add a Markdown cell before explaining it.

    if isJsroot and not nodraw:

        if isCpp():

            text += "\n# <markdowncell> \n# Draw all canvases \n# <codecell>\n%jsroot on\ngROOT->GetListOfCanvases()->Draw()"

        if extension == "py":

            text += "\n# <markdowncell> \n# Draw all canvases \n# <codecell>\n%jsroot on\nfrom ROOT import gROOT \ngROOT.GetListOfCanvases().Draw()"


    elif not nodraw:

        if isCpp():

            text += "\n# <markdowncell> \n# Draw all canvases \n# <codecell>\ngROOT->GetListOfCanvases()->Draw()"

        if extension == "py":

            text += "\n# <markdowncell> \n# Draw all canvases \n# <codecell>\nfrom ROOT import gROOT \ngROOT.GetListOfCanvases().Draw()"


    # Create a notebook from the working text

    nbook = v3.reads_py(text)

    nbook = v4.upgrade(nbook)  # Upgrade v3 to v4


    # Load notebook string into json format, essentially creating a dictionary

    json_data = json.loads(v4.writes(nbook))


    # add the corresponding metadata

    if extension == "py":

        json_data['metadata'] = {

            "kernelspec": {

                "display_name": "Python " + str(sys.version_info[0]),

                "language": "python",

                "name": "python" + str(sys.version_info[0])

            },

            "language_info": {

                "codemirror_mode": {

                    "name": "ipython",

                    "version": 2

                },

                "file_extension": ".py",

                "mimetype": "text/x-python",

                "name": "python",

                "nbconvert_exporter": "python",

                "pygments_lexer": "ipython2",

                "version": "2.7.10"

            }

        }

    elif isCpp():

        json_data['metadata'] = {

            "kernelspec": {

                "display_name": "ROOT C++",

                "language": "c++",

                "name": "root"

            },

            "language_info": {

                "codemirror_mode": "text/x-c++src",

                "file_extension": ".C",

                "mimetype": " text/x-c++src",

                "name": "c++"

            }

        }


    # write the json file with the metadata

    with open(outPathName, 'w') as fout:

        json.dump(json_data, fout, indent=1, sort_keys=True)


    timeout = findTimeout()


    # Call commmand that executes the notebook and creates a new notebook with the output

    r = subprocess.call(["jupyter", "nbconvert", "--ExecutePreprocessor.timeout={}".format(timeout), "--to=notebook", "--execute", outPathName])

    retry = 0

    while r != 0 and retry < 2:

        # Work around glitches in NB conversion

        retry += 1

        r = subprocess.call(["jupyter", "nbconvert", "--ExecutePreprocessor.timeout={}".format(timeout*2), "--to=notebook", "--execute", outPathName])


    if r != 0:

        sys.stderr.write("NOTEBOOK_CONVERSION_WARNING: Nbconvert failed for notebook %s with return code %s\n" %(outPathName,r))

        # If notebook conversion did not work, try again without the option --execute

        if subprocess.call(["jupyter", "nbconvert", "--ExecutePreprocessor.timeout={}".format(timeout),  "--to=notebook",  outPathName]) != 0:

            raise RuntimeError("NOTEBOOK_CONVERSION_WARNING: Nbconvert failed for notebook %s with return code %s\n" %(outname,r))

    else:

        if isJsroot:

            subprocess.call(["jupyter", "trust",  os.path.join(outdir, outnameconverted)])

        # Only remove notebook without output if nbconvert succeeds

        os.remove(outPathName)


    return r


if __name__ == "__main__":


    if str(sys.argv[1]) == "-test":

        tutName = "tutorial"

        doctest.testmod(verbose=True)


    else:

        # -------------------------------------

        # ----- Preliminary definitions--------

        # -------------------------------------


        # Extract and define the name of the file as well as its derived names

        tutPathName = str(sys.argv[1])

        tutPath = os.path.dirname(tutPathName)

        if tutPath.split("/")[-2] == "tutorials":

            tutRelativePath = "$ROOTSYS/tutorials/%s/" % tutPath.split("/")[-1]

        tutFileName = os.path.basename(tutPathName)

        tutName, extension = tutFileName.split(".")

        #tutTitle = re.sub( r"([A-Z\d])", r" \1", tutName).title()

        tutTitle = tutName

        outname = tutFileName + ".ipynb"

        outnameconverted = tutFileName + ".nbconvert.ipynb"


        # Extract output directory

        try:

            outdir = str(sys.argv[2])

        except:

            outdir = tutPath


        outPathName = os.path.join(outdir, outname)

        # Find and define the time and date this script is run

        date = datetime.now().strftime("%A, %B %d, %Y at %I:%M %p")


        # -------------------------------------

        # -------------------------------------

        # -------------------------------------


        # Set DYLD_LIBRARY_PATH. When run without root access or as a different user, especially from Mac systems,

        # it is possible for security reasons that the environment does not include this definition, so it is manually defined.

        os.environ["DYLD_LIBRARY_PATH"] = os.environ["ROOTSYS"] + "/lib"


        # Open the file to be converted

        with open(tutPathName) as fin:

            text = fin.read()


        # Extract information from header and remove header from text

        if extension == "py":

            text, description, author, isNotebook, isJsroot, nodraw, needsHeaderFile = readHeaderPython(text)

        elif isCpp():

            text, description, author, isNotebook, isJsroot, nodraw, needsHeaderFile = readHeaderCpp(text)


        if isNotebook:

            starttime = time.time()

            try:

                ret = mainfunction(text)

            except Exception as e:

                print("Failed to convert to notebook", outPathName)

                raise e

            print("Notebook {0} run time".format(tutFileName), time.time() - starttime)


            sys.exit(ret)

converttonotebook.unindenter
unindenter(string, spaces=3)
Returns string with each line unindented by 3 spaces.
Definition converttonotebook.py:74