tonyfast · October 26, 2022 08:03 · tony · Jul 17, 2022 · tonyfast · Jul 18, 2022
diff --git a/doctest-myst.ipynb b/doctest-myst.ipynb
 {
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Adding doctests to the markdown-it lexer and the docutils renderer in the MyST stack."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "    import markdown_it, docutils.nodes, myst_parser.docutils_renderer"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Create a lexing rule for markdown_it for doctests."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "    def doctest(state, startLine, endLine, silent, *, offset=0, continuation=True):\n",
    "        nextLine, start, maximum = startLine, state.bMarks[startLine] + state.tShift[startLine], state.eMarks[startLine]\n",
    "        \n",
    "        if not state.src[start:maximum].startswith(\">>> \"): return False\n",
    "        while nextLine < endLine:        \n",
    "            nextLine += 1\n",
    "            start, maximum = state.bMarks[nextLine] + state.tShift[nextLine], state.eMarks[nextLine]\n",
    "            if continuation:\n",
    "                continuation = state.src[start:maximum].startswith(\"... \")\n",
    "                if continuation: continue\n",
    "            if state.src[start:maximum].strip():\n",
    "                if state.src[start:maximum].startswith(\">>> \"):\n",
    "                    offset = 1\n",
    "                    break\n",
    "                continue\n",
    "            break\n",
    "            \n",
    "        old_parent, old_line_max = state.parentType, state.lineMax\n",
    "        state.parentType, state.lineMax = \"container\", nextLine-offset\n",
    "        \n",
    "        token = state.push(\"doctest\", \"code\", 0)\n",
    "        token.content = state.src[state.bMarks[startLine] : state.eMarks[state.lineMax]]\n",
    "        token.map = [startLine, state.lineMax]\n",
    "        state.parentType, state.lineMax, state.line = old_parent, old_line_max, nextLine\n",
    "        \n",
    "        return True"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Create a function that renders a doctest token as a docutils `doctest_block` node. The reStructuredText parser already supports doctest blocks; this adds the same feature to the MyST renderer."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "    def render_doctest(self, token)    :\n",
    "        node = docutils.nodes.doctest_block(''.join(token.content), ''.join(token.content))\n",
    "        self.add_line_and_source_path(node, token)\n",
    "        self.current_node.append(node)\n",
    "\n",
    "    myst_parser.docutils_renderer.DocutilsRenderer.render_doctest = render_doctest"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Our markdown parser is only concerned with block objects as we desire to tangle from the docutils document."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "    md = markdown_it.MarkdownIt().disable('inline')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Insert the doctest rule before the `code` rule. This way doctests are recognized both with and without indentation."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "    md.block.ruler.before(\"code\", \"doctest\", doctest, {\"alt\": []},)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Generate the markdown-it tokens."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "    tokens = md.parse(\"\"\"Testing\n",
    "    other taxes\n",
    "    \n",
    "        >>> 1\n",
    "        10\n",
    "        >>> 2\n",
    "        asdf\n",
    "        \n",
    "        print\n",
    "    \"\"\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Convert the tokens to a docutils document."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<document: <paragraph...><doctest_block...><doctest_block...><liter ...>,\n",
       " <paragraph: >,\n",
       " <doctest_block: <#text: '    >>> 1\\n    10'>>,\n",
       " <#text: '    >>> 1\\n    10'>,\n",
       " <doctest_block: <#text: '    >>> 2\\n     ...'>>,\n",
       " <#text: '    >>> 2\\n    asdf\\n    '>,\n",
       " <literal_block: <#text: 'print\\n'>>,\n",
       " <#text: 'print\\n'>]"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "    myst_parser.docutils_renderer.DocutilsRenderer(md).render(tokens,{},  markdown_it.utils.AttrDict()).traverse()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "https://gist.github.com/cfb55f41f5452ef33ec6fbb4e0bda991\n"
     ]
    }
   ],
   "source": [
    "    if 10:\n",
    "        !gist doctest-myst.ipynb -u cfb55f41f5452ef33ec6fbb4e0bda991"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
 }
	{
	"cells": [
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Adding doctests to the markdown-it lexer and the docutils renderer in the MyST stack."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 1,
	"metadata": {},
	"outputs": [],
	"source": [
	" import markdown_it, docutils.nodes, myst_parser.docutils_renderer"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Create a lexing rule for markdown_it for doctests."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 2,
	"metadata": {},
	"outputs": [],
	"source": [
	" def doctest(state, startLine, endLine, silent, *, offset=0, continuation=True):\n",
	" nextLine, start, maximum = startLine, state.bMarks[startLine] + state.tShift[startLine], state.eMarks[startLine]\n",
	" \n",
	" if not state.src[start:maximum].startswith(\">>> \"): return False\n",
	" while nextLine < endLine: \n",
	" nextLine += 1\n",
	" start, maximum = state.bMarks[nextLine] + state.tShift[nextLine], state.eMarks[nextLine]\n",
	" if continuation:\n",
	" continuation = state.src[start:maximum].startswith(\"... \")\n",
	" if continuation: continue\n",
	" if state.src[start:maximum].strip():\n",
	" if state.src[start:maximum].startswith(\">>> \"):\n",
	" offset = 1\n",
	" break\n",
	" continue\n",
	" break\n",
	" \n",
	" old_parent, old_line_max = state.parentType, state.lineMax\n",
	" state.parentType, state.lineMax = \"container\", nextLine-offset\n",
	" \n",
	" token = state.push(\"doctest\", \"code\", 0)\n",
	" token.content = state.src[state.bMarks[startLine] : state.eMarks[state.lineMax]]\n",
	" token.map = [startLine, state.lineMax]\n",
	" state.parentType, state.lineMax, state.line = old_parent, old_line_max, nextLine\n",
	" \n",
	" return True"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Create a function that renders a doctest token as a docutils `doctest_block` node. The reStructuredText parser already supports doctest blocks; this adds the same feature to the MyST renderer."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 3,
	"metadata": {},
	"outputs": [],
	"source": [
	" def render_doctest(self, token) :\n",
	" node = docutils.nodes.doctest_block(''.join(token.content), ''.join(token.content))\n",
	" self.add_line_and_source_path(node, token)\n",
	" self.current_node.append(node)\n",
	"\n",
	" myst_parser.docutils_renderer.DocutilsRenderer.render_doctest = render_doctest"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Our markdown parser is only concerned with block objects as we desire to tangle from the docutils document."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 4,
	"metadata": {},
	"outputs": [],
	"source": [
	" md = markdown_it.MarkdownIt().disable('inline')"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Insert the doctest rule before the `code` rule. This way doctests are recognized both with and without indentation."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 5,
	"metadata": {},
	"outputs": [],
	"source": [
	" md.block.ruler.before(\"code\", \"doctest\", doctest, {\"alt\": []},)"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Generate the markdown-it tokens."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 6,
	"metadata": {},
	"outputs": [],
	"source": [
	" tokens = md.parse(\"\"\"Testing\n",
	" other taxes\n",
	" \n",
	" >>> 1\n",
	" 10\n",
	" >>> 2\n",
	" asdf\n",
	" \n",
	" print\n",
	" \"\"\")"
	]
	},
	{
	"cell_type": "markdown",
	"metadata": {},
	"source": [
	"Convert the tokens to a docutils document."
	]
	},
	{
	"cell_type": "code",
	"execution_count": 7,
	"metadata": {},
	"outputs": [
	{
	"data": {
	"text/plain": [
	"[<document: <paragraph...><doctest_block...><doctest_block...><liter ...>,\n",
	" <paragraph: >,\n",
	" <doctest_block: <#text: ' >>> 1\\n 10'>>,\n",
	" <#text: ' >>> 1\\n 10'>,\n",
	" <doctest_block: <#text: ' >>> 2\\n ...'>>,\n",
	" <#text: ' >>> 2\\n asdf\\n '>,\n",
	" <literal_block: <#text: 'print\\n'>>,\n",
	" <#text: 'print\\n'>]"
	]
	},
	"execution_count": 7,
	"metadata": {},
	"output_type": "execute_result"
	}
	],
	"source": [
	" myst_parser.docutils_renderer.DocutilsRenderer(md).render(tokens,{}, markdown_it.utils.AttrDict()).traverse()"
	]
	},
	{
	"cell_type": "code",
	"execution_count": 8,
	"metadata": {},
	"outputs": [
	{
	"name": "stdout",
	"output_type": "stream",
	"text": [
	"https://gist.github.com/cfb55f41f5452ef33ec6fbb4e0bda991\n"
	]
	}
	],
	"source": [
	" if 10:\n",
	" !gist doctest-myst.ipynb -u cfb55f41f5452ef33ec6fbb4e0bda991"
	]
	}
	],
	"metadata": {
	"kernelspec": {
	"display_name": "Python 3",
	"language": "python",
	"name": "python3"
	},
	"language_info": {
	"codemirror_mode": {
	"name": "ipython",
	"version": 3
	},
	"file_extension": ".py",
	"mimetype": "text/x-python",
	"name": "python",
	"nbconvert_exporter": "python",
	"pygments_lexer": "ipython3",
	"version": "3.7.7"
	}
	},
	"nbformat": 4,
	"nbformat_minor": 4
	}