diff --git a/fiddle/examples/colabs/auto_config.ipynb b/fiddle/examples/colabs/auto_config.ipynb
index 362abf53..07f0b5e1 100644
--- a/fiddle/examples/colabs/auto_config.ipynb
+++ b/fiddle/examples/colabs/auto_config.ipynb
@@ -19,7 +19,7 @@
"id": "clAaVdLF-ndS"
},
"source": [
- "## Imports \u0026 model setup\n",
+ "## Imports & model setup\n",
"\n",
"As in the intro, we first import Fiddle, and then JAX and Flax as normal, and then define our model and model-building functions as if we didn't need to worry about configuration."
]
@@ -250,9 +250,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"320pt\" height=\"177pt\"\n viewBox=\"0.00 0.00 320.00 177.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 173)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-173 316,-173 316,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"109,-28.5 109,-47.5 187,-47.5 187,-28.5 109,-28.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109,-28.5 109,-47.5 187,-47.5 187,-28.5 109,-28.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"113.5\" y=\"-36.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"145.5\" y=\"-36.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"109,-9.5 109,-28.5 166,-28.5 166,-9.5 109,-9.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109,-9.5 109,-28.5 166,-28.5 166,-9.5 109,-9.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"113\" y=\"-16.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"166,-9.5 166,-28.5 187,-28.5 187,-9.5 166,-9.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"170\" y=\"-16.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" 
class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"0,-150 0,-169 312,-169 312,-150 0,-150\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-150 0,-169 312,-169 312,-150 0,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109.5\" y=\"-158\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"141.5\" y=\"-158\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleMLP\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-131 0,-150 87,-150 87,-131 0,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-131 0,-150 87,-150 87,-131 0,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"46\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense1\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-131 87,-150 312,-150 312,-131 87,-131\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"91,-135 91,-146 308,-146 308,-135 91,-135\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"91,-135 91,-146 308,-146 308,-135 91,-135\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-112 0,-131 87,-131 87,-112 0,-112\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-112 0,-131 87,-131 87,-112 0,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eactivation_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-112 87,-131 312,-131 312,-112 87,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"91\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function sigmoid at 0x7f01361517a0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-93 0,-112 87,-112 87,-93 0,-93\"/\u003e\n\u003cpolygon 
fill=\"none\" stroke=\"black\" points=\"0,-93 0,-112 87,-112 87,-93 0,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"46\" y=\"-100\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense2\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-93 87,-112 312,-112 312,-93 87,-93\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"91,-97 91,-108 308,-108 308,-97 91,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"91,-97 91,-108 308,-108 308,-97 91,-97\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M197.63,-134.96C190.48,-119.77 168.85,-73.8 156.63,-47.85\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"205,-37.5 205,-56.5 301,-56.5 301,-37.5 205,-37.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"205,-37.5 205,-56.5 301,-56.5 301,-37.5 205,-37.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"218.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"250.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"205,-18.5 205,-37.5 262,-37.5 262,-18.5 205,-18.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"205,-18.5 205,-37.5 262,-37.5 262,-18.5 205,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"209\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"262,-18.5 262,-37.5 301,-37.5 301,-18.5 
262,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"266\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"205,0.5 205,-18.5 262,-18.5 262,0.5 205,0.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"205,0.5 205,-18.5 262,-18.5 262,0.5 205,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"209\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003euse_bias\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"262,0.5 262,-18.5 301,-18.5 301,0.5 262,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"266\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eFalse\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M203.16,-96.74C208.86,-89.05 221.32,-72.23 232.36,-57.35\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7f01221c4a90\u003e"
+ "<graphviz.dot.Graph at 0x7f01221c4a90>"
]
},
"execution_count": 6,
@@ -272,7 +272,7 @@
"id": "alA2V9MHoK7F"
},
"source": [
- "\u003e Note: For additional documentation on the visualization used in this colab, see the [visualization, printing, and codegen colab](visualization_printing_codegen.ipynb)."
+ "> Note: For additional documentation on the visualization used in this colab, see the [visualization, printing, and codegen colab](visualization_printing_codegen.ipynb)."
]
},
{
@@ -430,9 +430,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"320pt\" height=\"158pt\"\n viewBox=\"0.00 0.00 320.00 158.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 154)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-154 316,-154 316,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"113,-19 113,-38 191,-38 191,-19 113,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"113,-19 113,-38 191,-38 191,-19 113,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"117.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"149.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"113,0 113,-19 170,-19 170,0 113,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"113,0 113,-19 170,-19 170,0 113,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"117\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"170,0 170,-19 191,-19 191,0 170,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"174\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon 
fill=\"#ffc0cb\" stroke=\"transparent\" points=\"0,-131 0,-150 312,-150 312,-131 0,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-131 0,-150 312,-150 312,-131 0,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109.5\" y=\"-139\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"141.5\" y=\"-139\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleMLP\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-112 0,-131 87,-131 87,-112 0,-112\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-112 0,-131 87,-131 87,-112 0,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"46\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense1\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-112 87,-131 312,-131 312,-112 87,-112\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"91,-116 91,-127 308,-127 308,-116 91,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"91,-116 91,-127 308,-127 308,-116 91,-116\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-93 0,-112 87,-112 87,-93 0,-93\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-93 0,-112 87,-112 87,-93 0,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-100\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eactivation_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-93 87,-112 312,-112 312,-93 87,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"91\" y=\"-100\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function sigmoid at 0x7f01361517a0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-74 0,-93 87,-93 87,-74 0,-74\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-74 0,-93 87,-93 87,-74 
0,-74\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"46\" y=\"-81\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense2\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"87,-74 87,-93 312,-93 312,-74 87,-74\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"91,-78 91,-89 308,-89 308,-78 91,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"91,-78 91,-89 308,-89 308,-78 91,-78\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M197.55,-115.85C190.83,-101.7 171.82,-61.7 160.6,-38.09\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"210,-19 210,-38 287,-38 287,-19 210,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"210,-19 210,-38 287,-38 287,-19 210,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"214\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"246\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"210,0 210,-19 269,-19 269,0 210,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"210,0 210,-19 269,-19 269,0 210,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"216\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"269,0 269,-19 287,-19 287,0 269,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"273\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 
0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M203.15,-77.93C209.28,-70.01 223.16,-52.09 233.87,-38.26\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7f0122742e10\u003e"
+ "<graphviz.dot.Graph at 0x7f0122742e10>"
]
},
"execution_count": 9,
@@ -488,9 +488,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"602pt\" height=\"177pt\"\n viewBox=\"0.00 0.00 602.00 177.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 173)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-173 598,-173 598,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"0,-37.5 0,-56.5 288,-56.5 288,-37.5 0,-37.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-37.5 0,-56.5 288,-56.5 288,-37.5 0,-37.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"141.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-18.5 0,-37.5 75,-37.5 75,-18.5 0,-18.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-18.5 0,-37.5 75,-37.5 75,-18.5 0,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"22\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"75,-18.5 75,-37.5 288,-37.5 288,-18.5 75,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"79\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,0.5 0,-18.5 75,-18.5 75,0.5 
0,0.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,0.5 0,-18.5 75,-18.5 75,0.5 0,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ekernel_init\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"75,0.5 75,-18.5 288,-18.5 288,0.5 75,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"79\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function zeros at 0x7f013698def0\u0026gt;\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"97,-150 97,-169 409,-169 409,-150 97,-150\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97,-150 97,-169 409,-169 409,-150 97,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"206.5\" y=\"-158\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"238.5\" y=\"-158\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleMLP\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"97,-131 97,-150 184,-150 184,-131 97,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97,-131 97,-150 184,-150 184,-131 97,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"143\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense1\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"184,-131 184,-150 409,-150 409,-131 184,-131\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"188,-135 188,-146 405,-146 405,-135 188,-135\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"188,-135 188,-146 405,-146 405,-135 188,-135\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"97,-112 97,-131 184,-131 184,-112 97,-112\"/\u003e\n\u003cpolygon 
fill=\"none\" stroke=\"black\" points=\"97,-112 97,-131 184,-131 184,-112 97,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"101\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eactivation_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"184,-112 184,-131 409,-131 409,-112 184,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"188\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function sigmoid at 0x7f01361517a0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"97,-93 97,-112 184,-112 184,-93 97,-93\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97,-93 97,-112 184,-112 184,-93 97,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"143\" y=\"-100\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense2\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"184,-93 184,-112 409,-112 409,-93 184,-93\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"188,-97 188,-108 405,-108 405,-97 188,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"188,-97 188,-108 405,-108 405,-97 188,-97\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M290.03,-134.96C271.32,-121.45 218.96,-83.63 182.31,-57.17\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"306,-37.5 306,-56.5 594,-56.5 594,-37.5 306,-37.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"306,-37.5 306,-56.5 594,-56.5 594,-37.5 306,-37.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"415.5\" y=\"-45.5\" font-family=\"Courier,monospace\" 
font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"447.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"306,-18.5 306,-37.5 381,-37.5 381,-18.5 306,-18.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"306,-18.5 306,-37.5 381,-37.5 381,-18.5 306,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"328\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"381,-18.5 381,-37.5 594,-37.5 594,-18.5 381,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"385\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"306,0.5 306,-18.5 381,-18.5 381,0.5 306,0.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"306,0.5 306,-18.5 381,-18.5 381,0.5 306,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"310\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ekernel_init\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"381,0.5 381,-18.5 594,-18.5 594,0.5 381,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"385\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function zeros at 0x7f013698def0\u0026gt;\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M305.66,-96.95C322.04,-89.3 358.78,-72.13 391.09,-57.03\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7f012286a810\u003e"
+ "<graphviz.dot.Graph at 0x7f012286a810>"
]
},
"execution_count": 10,
@@ -547,9 +547,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"326pt\" height=\"158pt\"\n viewBox=\"0.00 0.00 325.50 158.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 154)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-154 321.5,-154 321.5,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"0,-19 0,-38 78,-38 78,-19 0,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-19 0,-38 78,-38 78,-19 0,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"36.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,0 0,-19 57,-19 57,0 0,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,0 0,-19 57,-19 57,0 0,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,0 57,-19 78,-19 78,0 57,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" 
points=\"62,-131 62,-150 168,-150 168,-131 62,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" stroke-dasharray=\"5,2\" points=\"62,-131 62,-150 168,-150 168,-131 62,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"66\" y=\"-139\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003ePartial:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"103\" y=\"-139\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleMLP\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" stroke-dasharray=\"5,2\" points=\"62,-112 62,-131 150,-131 150,-112 62,-112\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"62,-112 62,-131 150,-131 150,-112 62,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109\" y=\"-119\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense1\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"150,-112 150,-131 168,-131 168,-112 150,-112\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"154,-116 154,-127 164,-127 164,-116 154,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"154,-116 154,-127 164,-127 164,-116 154,-116\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"62,-93 62,-112 150,-112 150,-93 62,-93\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"62,-93 62,-112 150,-112 150,-93 62,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"67\" y=\"-100\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eactivation_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"150,-93 150,-112 168,-112 168,-93 150,-93\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"154,-97 154,-108 164,-108 164,-97 154,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" stroke-dasharray=\"5,2\" points=\"154,-97 154,-108 164,-108 164,-97 154,-97\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" stroke-dasharray=\"5,2\" points=\"62,-74 
62,-93 150,-93 150,-74 62,-74\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"62,-74 62,-93 150,-93 150,-74 62,-74\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109\" y=\"-81\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense2\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"150,-74 150,-93 168,-93 168,-74 150,-74\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"transparent\" points=\"154,-78 154,-89 164,-89 164,-78 154,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"154,-78 154,-89 164,-89 164,-78 154,-78\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M153.84,-116.66C137.96,-103.29 89.14,-62.2 60.52,-38.12\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"96,-19 96,-38 222,-38 222,-19 96,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" stroke-dasharray=\"5,2\" points=\"96,-19 96,-38 222,-38 222,-19 96,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"107\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003ePartial:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"144\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e leaky_relu\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" stroke-dasharray=\"5,2\" points=\"96,0 96,-19 189,-19 189,0 96,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"96,0 96,-19 189,-19 189,0 96,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"100\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enegative_slope\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"189,0 189,-19 
222,-19 222,0 189,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"193\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0.05\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M159,-96.65C159,-85.8 159,-57.1 159,-38.06\"/\u003e\n\u003c/g\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"transparent\" points=\"241,-19 241,-38 318,-38 318,-19 241,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"241,-19 241,-38 318,-38 318,-19 241,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"245\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"277\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"241,0 241,-19 300,-19 300,0 241,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"241,0 241,-19 300,-19 300,0 241,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"247\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"300,0 300,-19 318,-19 318,0 300,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"304\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M164.16,-79.34C177.75,-72.31 215.47,-52.82 
244.01,-38.08\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7f01223dc6d0\u003e"
+ "<graphviz.dot.Graph at 0x7f01223dc6d0>"
]
},
"execution_count": 11,
@@ -605,7 +605,7 @@
" kernel_init = init\n",
" bias_init = zeros\n",
" )\n",
- " activation_fn = functools.partial(\u003cfunction leaky_relu at 0x7f01365703b0\u003e, negative_slope=0.05)\n",
+ " activation_fn = functools.partial(<function leaky_relu at 0x7f01365703b0>, negative_slope=0.05)\n",
" dense2 = Dense(\n",
" # attributes\n",
" features = 1\n",
@@ -887,9 +887,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"503pt\" height=\"327pt\"\n viewBox=\"0.00 0.00 503.00 327.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 323)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-323 499,-323 499,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"0.5,-121.5 0.5,-140.5 89.5,-140.5 89.5,-121.5 0.5,-121.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-121.5 0.5,-140.5 89.5,-140.5 89.5,-121.5 0.5,-121.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4.5\" y=\"-129.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"36.5\" y=\"-129.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e PRNGKey\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0.5,-102.5 0.5,-121.5 50.5,-121.5 50.5,-102.5 0.5,-102.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-102.5 0.5,-121.5 50.5,-121.5 50.5,-102.5 0.5,-102.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"21.5\" y=\"-109.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eseed\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"50.5,-102.5 50.5,-121.5 89.5,-121.5 89.5,-102.5 50.5,-102.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"54.5\" y=\"-109.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e42\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 
--\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"42.5,-300 42.5,-319 336.5,-319 336.5,-300 42.5,-300\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-300 42.5,-319 336.5,-319 336.5,-300 42.5,-300\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"149\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"181\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Trainer\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"42.5,-281 42.5,-300 105.5,-300 105.5,-281 42.5,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-281 42.5,-300 105.5,-300 105.5,-281 42.5,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"82.5\" y=\"-288\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003erng\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105.5,-281 105.5,-300 336.5,-300 336.5,-281 105.5,-281\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"109.5,-285 109.5,-296 332.5,-296 332.5,-285 109.5,-285\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109.5,-285 109.5,-296 332.5,-296 332.5,-285 109.5,-285\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"42.5,-262 42.5,-281 105.5,-281 105.5,-262 42.5,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-262 42.5,-281 105.5,-281 105.5,-262 42.5,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"70.5\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003emodel\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105.5,-262 105.5,-281 336.5,-281 336.5,-262 105.5,-262\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"109.5,-266 109.5,-277 332.5,-277 332.5,-266 109.5,-266\"/\u003e\n\u003cpolygon 
fill=\"none\" stroke=\"black\" points=\"109.5,-266 109.5,-277 332.5,-277 332.5,-266 109.5,-266\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"42.5,-243 42.5,-262 105.5,-262 105.5,-243 42.5,-243\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-243 42.5,-262 105.5,-262 105.5,-243 42.5,-243\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"46.5\" y=\"-250\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoptimizer\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105.5,-243 105.5,-262 336.5,-262 336.5,-243 105.5,-243\"/\u003e\n\u003cpolygon fill=\"#8fbc8f\" stroke=\"transparent\" points=\"109.5,-247 109.5,-258 332.5,-258 332.5,-247 109.5,-247\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109.5,-247 109.5,-258 332.5,-258 332.5,-247 109.5,-247\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"42.5,-224 42.5,-243 105.5,-243 105.5,-224 42.5,-224\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-224 42.5,-243 105.5,-243 105.5,-224 42.5,-224\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"58.5\" y=\"-231\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eloss_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105.5,-224 105.5,-243 336.5,-243 336.5,-224 105.5,-224\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109.5\" y=\"-231\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function mse_loss at 0x7f01223e5f80\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"42.5,-205 42.5,-224 105.5,-224 105.5,-205 42.5,-205\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"42.5,-205 42.5,-224 105.5,-224 105.5,-205 42.5,-205\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"52.5\" y=\"-212\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eexamples\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105.5,-205 105.5,-224 
336.5,-224 336.5,-205 105.5,-205\"/\u003e\n\u003cpolygon fill=\"#adff2f\" stroke=\"transparent\" points=\"109.5,-209 109.5,-220 332.5,-220 332.5,-209 109.5,-209\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109.5,-209 109.5,-220 332.5,-220 332.5,-209 109.5,-209\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M216.01,-284.8C192.96,-262.99 103.39,-178.23 63.66,-140.64\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"107.5,-140.5 107.5,-159.5 210.5,-159.5 210.5,-140.5 107.5,-140.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"107.5,-140.5 107.5,-159.5 210.5,-159.5 210.5,-140.5 107.5,-140.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"112.5\" y=\"-148.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"144.5\" y=\"-148.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleMLP\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"107.5,-121.5 107.5,-140.5 194.5,-140.5 194.5,-121.5 107.5,-121.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"107.5,-121.5 107.5,-140.5 194.5,-140.5 194.5,-121.5 107.5,-121.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"153.5\" y=\"-128.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense1\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"194.5,-121.5 194.5,-140.5 210.5,-140.5 210.5,-121.5 194.5,-121.5\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"transparent\" points=\"198.5,-125.5 198.5,-136.5 206.5,-136.5 206.5,-125.5 198.5,-125.5\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"198.5,-125.5 198.5,-136.5 206.5,-136.5 206.5,-125.5 198.5,-125.5\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"107.5,-102.5 107.5,-121.5 194.5,-121.5 194.5,-102.5 107.5,-102.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"107.5,-102.5 107.5,-121.5 194.5,-121.5 194.5,-102.5 107.5,-102.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"111.5\" y=\"-109.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eactivation_fn\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"194.5,-102.5 194.5,-121.5 210.5,-121.5 210.5,-102.5 194.5,-102.5\"/\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"transparent\" points=\"198.5,-106.5 198.5,-117.5 206.5,-117.5 206.5,-106.5 198.5,-106.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" stroke-dasharray=\"5,2\" points=\"198.5,-106.5 198.5,-117.5 206.5,-117.5 206.5,-106.5 198.5,-106.5\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" stroke-dasharray=\"5,2\" points=\"107.5,-83.5 107.5,-102.5 194.5,-102.5 194.5,-83.5 107.5,-83.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"107.5,-83.5 107.5,-102.5 194.5,-102.5 194.5,-83.5 107.5,-83.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"153.5\" y=\"-90.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edense2\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"194.5,-83.5 194.5,-102.5 210.5,-102.5 210.5,-83.5 194.5,-83.5\"/\u003e\n\u003cpolygon fill=\"#ff8c00\" stroke=\"transparent\" points=\"198.5,-87.5 198.5,-98.5 206.5,-98.5 206.5,-87.5 198.5,-87.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"198.5,-87.5 198.5,-98.5 206.5,-98.5 206.5,-87.5 198.5,-87.5\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge5\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" 
stroke-opacity=\"0.188235\" d=\"M219.26,-265.71C212.18,-249.03 189.85,-196.4 174.33,-159.82\"/\u003e\n\u003c/g\u003e\n\u003c!-- 6 --\u003e\n\u003cg id=\"node7\" class=\"node\"\u003e\n\u003ctitle\u003e6\u003c/title\u003e\n\u003cpolygon fill=\"#8fbc8f\" stroke=\"transparent\" points=\"228.5,-121.5 228.5,-140.5 342.5,-140.5 342.5,-121.5 228.5,-121.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"228.5,-121.5 228.5,-140.5 342.5,-140.5 342.5,-121.5 228.5,-121.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"257\" y=\"-129.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"289\" y=\"-129.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e sgd\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"228.5,-102.5 228.5,-121.5 315.5,-121.5 315.5,-102.5 228.5,-102.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"228.5,-102.5 228.5,-121.5 315.5,-121.5 315.5,-102.5 228.5,-102.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"232.5\" y=\"-109.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elearning_rate\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"315.5,-102.5 315.5,-121.5 342.5,-121.5 342.5,-102.5 315.5,-102.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"319.5\" y=\"-109.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0.1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;6 --\u003e\n\u003cg id=\"edge6\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;6:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M223.63,-246.72C231.78,-230.35 261.33,-171.03 276.45,-140.67\"/\u003e\n\u003c/g\u003e\n\u003c!-- 7 --\u003e\n\u003cg id=\"node9\" class=\"node\"\u003e\n\u003ctitle\u003e7\u003c/title\u003e\n\u003cpolygon fill=\"#adff2f\" stroke=\"transparent\" points=\"361.5,-149.5 361.5,-168.5 
462.5,-168.5 462.5,-149.5 361.5,-149.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"361.5,-149.5 361.5,-168.5 462.5,-168.5 462.5,-149.5 361.5,-149.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"365.5\" y=\"-157.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"397.5\" y=\"-157.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e make_data\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"361.5,-130.5 361.5,-149.5 438.5,-149.5 438.5,-130.5 361.5,-130.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"361.5,-130.5 361.5,-149.5 438.5,-149.5 438.5,-130.5 361.5,-130.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"415.5\" y=\"-137.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ekey\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"438.5,-130.5 438.5,-149.5 462.5,-149.5 462.5,-130.5 438.5,-130.5\"/\u003e\n\u003cpolygon fill=\"#ff6347\" stroke=\"transparent\" points=\"442.5,-134.5 442.5,-145.5 458.5,-145.5 458.5,-134.5 442.5,-134.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"442.5,-134.5 442.5,-145.5 458.5,-145.5 458.5,-134.5 442.5,-134.5\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"361.5,-111.5 361.5,-130.5 438.5,-130.5 438.5,-111.5 361.5,-111.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"361.5,-111.5 361.5,-130.5 438.5,-130.5 438.5,-111.5 361.5,-111.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"367.5\" y=\"-118.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enum_batches\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"438.5,-111.5 438.5,-130.5 462.5,-130.5 462.5,-111.5 438.5,-111.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"442.5\" y=\"-118.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" 
stroke=\"transparent\" points=\"361.5,-92.5 361.5,-111.5 438.5,-111.5 438.5,-92.5 361.5,-92.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"361.5,-92.5 361.5,-111.5 438.5,-111.5 438.5,-92.5 361.5,-92.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"373.5\" y=\"-99.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ebatch_size\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"438.5,-92.5 438.5,-111.5 462.5,-111.5 462.5,-92.5 438.5,-92.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"442.5\" y=\"-99.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e32\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"361.5,-73.5 361.5,-92.5 438.5,-92.5 438.5,-73.5 361.5,-73.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"361.5,-73.5 361.5,-92.5 438.5,-92.5 438.5,-73.5 361.5,-73.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"373.5\" y=\"-80.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003einput_dims\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"438.5,-73.5 438.5,-92.5 462.5,-92.5 462.5,-73.5 438.5,-73.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"442.5\" y=\"-80.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e20\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;7 --\u003e\n\u003cg id=\"edge8\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;7:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M239.51,-208.93C265.34,-202.65 313.93,-189.18 351.5,-169 354.63,-167.32 357.78,-165.47 360.89,-163.52\"/\u003e\n\u003c/g\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"transparent\" points=\"43.5,-19 43.5,-38 121.5,-38 121.5,-19 43.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"43.5,-19 43.5,-38 121.5,-38 
121.5,-19 43.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"48\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"80\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"43.5,0 43.5,-19 100.5,-19 100.5,0 43.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"43.5,0 43.5,-19 100.5,-19 100.5,0 43.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"47.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"100.5,0 100.5,-19 121.5,-19 121.5,0 100.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"104.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e10\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M198.23,-126.57C183.03,-112.57 130.95,-64.61 102.11,-38.06\"/\u003e\n\u003c/g\u003e\n\u003c!-- 4 --\u003e\n\u003cg id=\"node5\" class=\"node\"\u003e\n\u003ctitle\u003e4\u003c/title\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"transparent\" points=\"139.5,-19 139.5,-38 265.5,-38 265.5,-19 139.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" stroke-dasharray=\"5,2\" points=\"139.5,-19 139.5,-38 265.5,-38 265.5,-19 139.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"150.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003ePartial:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"187.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e leaky_relu\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" stroke-dasharray=\"5,2\" points=\"139.5,0 
139.5,-19 232.5,-19 232.5,0 139.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"139.5,0 139.5,-19 232.5,-19 232.5,0 139.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"143.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enegative_slope\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"232.5,0 232.5,-19 265.5,-19 265.5,0 232.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"236.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0.02\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;4 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;4:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M202.5,-106.38C202.5,-94.55 202.5,-59.98 202.5,-38.33\"/\u003e\n\u003c/g\u003e\n\u003c!-- 5 --\u003e\n\u003cg id=\"node6\" class=\"node\"\u003e\n\u003ctitle\u003e5\u003c/title\u003e\n\u003cpolygon fill=\"#ff8c00\" stroke=\"transparent\" points=\"284.5,-19 284.5,-38 361.5,-38 361.5,-19 284.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"284.5,-19 284.5,-38 361.5,-38 361.5,-19 284.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"288.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"320.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"284.5,0 284.5,-19 343.5,-19 343.5,0 284.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"284.5,0 284.5,-19 343.5,-19 343.5,0 284.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"290.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"343.5,0 343.5,-19 361.5,-19 361.5,0 343.5,0\"/\u003e\n\u003ctext 
text-anchor=\"start\" x=\"347.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;5 --\u003e\n\u003cg id=\"edge4\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;5:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M205.83,-87.39C209.05,-83.59 214.21,-77.95 219.5,-74 239.24,-59.26 263.55,-46.31 283.6,-36.78\"/\u003e\n\u003c/g\u003e\n\u003c!-- 8 --\u003e\n\u003cg id=\"node8\" class=\"node\"\u003e\n\u003ctitle\u003e8\u003c/title\u003e\n\u003cpolygon fill=\"#ff6347\" stroke=\"transparent\" points=\"406.5,-19 406.5,-38 495.5,-38 495.5,-19 406.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"406.5,-19 406.5,-38 495.5,-38 495.5,-19 406.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"410.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"442.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e PRNGKey\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"406.5,0 406.5,-19 456.5,-19 456.5,0 406.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"406.5,0 406.5,-19 456.5,-19 456.5,0 406.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"427.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eseed\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"456.5,0 456.5,-19 495.5,-19 495.5,0 456.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"460.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e13\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 7\u0026#45;\u0026#45;8 --\u003e\n\u003cg id=\"edge7\" class=\"edge\"\u003e\n\u003ctitle\u003e7:c\u0026#45;\u0026#45;8:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" 
d=\"M450.5,-134.37C450.5,-117.93 450.5,-66.04 450.5,-38.15\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7f01223f53d0\u003e"
+ "<graphviz.dot.Graph at 0x7f01223f53d0>"
]
},
"execution_count": 15,
diff --git a/fiddle/examples/colabs/basic_api.ipynb b/fiddle/examples/colabs/basic_api.ipynb
index f346f917..0368073f 100644
--- a/fiddle/examples/colabs/basic_api.ipynb
+++ b/fiddle/examples/colabs/basic_api.ipynb
@@ -196,7 +196,7 @@
"try:\n",
" foo_config.qux = 4\n",
"except AttributeError as e:\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003eTypeError: {e}\u003c/span\u003e'))\n",
+ " display(HTML(f'<span style=\"color: red\">TypeError: {e}</span>'))\n",
"else:\n",
" raise AssertionError(\"This should raise an error!\")"
]
@@ -302,7 +302,7 @@
"try:\n",
" p_config[:] = [1, 2, 3, 4, 5, 6]\n",
"except ValueError as e:\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003eValueError: {e}\u003c/span\u003e'))\n",
+ " display(HTML(f'<span style=\"color: red\">ValueError: {e}</span>'))\n",
"\n",
"# To achieve the same purpose, modify variadic positional args separately.\n",
"p_config[:fdl.VARARGS] = [1, 2, 3]\n",
@@ -453,7 +453,7 @@
},
"outputs": [],
"source": [
- "def trainer_config() -\u003e fdl.Config:\n",
+ "def trainer_config() -> fdl.Config:\n",
" checkpointer_config = fdl.Partial(\n",
" Checkpointer, base_directory=\"/path/to/my/dir\", checkpoints_to_keep=5)\n",
" return fdl.Config(Trainer, checkpointer_cls=checkpointer_config)\n",
@@ -576,8 +576,8 @@
"try:\n",
" fdl.build(fdl.Config(bar))\n",
"except Exception as e:\n",
- " error_message = str(e).replace(\"\\n\", \"\u003cbr/\u003e\")\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003e{type(e).__name__}: {error_message}\u003c/span\u003e'))\n",
+ " error_message = str(e).replace(\"\\n\", \"<br/>\")\n",
+ " display(HTML(f'<span style=\"color: red\">{type(e).__name__}: {error_message}</span>'))\n",
"else:\n",
" raise AssertionError(\"This should raise an error!\")"
]
@@ -601,7 +601,7 @@
},
"outputs": [],
"source": [
- "def my_error_function(a) -\u003e Foo:\n",
+ "def my_error_function(a) -> Foo:\n",
" raise ValueError(\"Error!\")\n",
"\n",
"foo_config = fdl.Config(Foo, a=1)\n",
@@ -609,8 +609,8 @@
"try:\n",
" fdl.build(config)\n",
"except Exception as e:\n",
- " error_message = str(e).replace(\"\\n\", \"\u003cbr/\u003e\")\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003e{type(e).__name__}: {error_message}\u003c/span\u003e'))\n",
+ " error_message = str(e).replace(\"\\n\", \"<br/>\")\n",
+ " display(HTML(f'<span style=\"color: red\">{type(e).__name__}: {error_message}</span>'))\n",
"\n",
"else:\n",
" raise AssertionError(\"This should raise an error!\")"
@@ -669,7 +669,7 @@
"class FooWithId(Foo):\n",
"\n",
" def __repr__(self):\n",
- " return f\"Foo\u003c{id(self)}\u003e(a={self.a})\"\n",
+ " return f\"Foo<{id(self)}>(a={self.a})\"\n",
"\n",
"\n",
"foo_config = fdl.Config(FooWithId, a=1)\n",
@@ -751,7 +751,7 @@
"try:\n",
" hash(config)\n",
"except TypeError as e:\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003eTypeError: {e}\u003c/span\u003e'))\n",
+ " display(HTML(f'<span style=\"color: red\">TypeError: {e}</span>'))\n",
"else:\n",
" raise AssertionError(\"This should raise an error!\")"
]
diff --git a/fiddle/examples/colabs/fiddle_tutorial_with_flax.ipynb b/fiddle/examples/colabs/fiddle_tutorial_with_flax.ipynb
index 8e994e7f..25107448 100644
--- a/fiddle/examples/colabs/fiddle_tutorial_with_flax.ipynb
+++ b/fiddle/examples/colabs/fiddle_tutorial_with_flax.ipynb
@@ -19,7 +19,7 @@
"id": "E2AM3bRspe0Y"
},
"source": [
- "\u003e Note to the reader: use the outline feature in Colab to easily navigate between the different sections of this tutorial."
+ "> Note to the reader: use the outline feature in Colab to easily navigate between the different sections of this tutorial."
]
},
{
@@ -69,7 +69,7 @@
"\n",
"Here, we use JAX and Flax to define our working example. When starting out in a new codebase, we recommend _not_ using Fiddle. Instead, just write your code \"normally\"; Fiddle is designed to be gradually added to a codebase when the codebase has scaled (either in size or in number of concurrent users) to justify adding the dependency.\n",
"\n",
- "\u003e This Fiddle design principle is related to the concept of \"progressive disclosure of complexity\", where you only need to pay for conceptual overhead when it is a worthwhile tradeoff."
+ "> This Fiddle design principle is related to the concept of \"progressive disclosure of complexity\", where you only need to pay for conceptual overhead when it is a worthwhile tradeoff."
]
},
{
@@ -203,7 +203,7 @@
"id": "Qs_XsuI_KCEv"
},
"source": [
- "\u003e Note: You can use `fiddle.experimental.auto_config` to avoid rewriting `make_model`. Please see the [`auto_config` tutorial][auto_config] for more details.\n",
+ "> Note: You can use `fiddle.experimental.auto_config` to avoid rewriting `make_model`. Please see the [`auto_config` tutorial][auto_config] for more details.\n",
"\n",
"[auto_config]: https://colab.sandbox.google.com/github/google/fiddle/blob/main/fiddle/examples/colabs/auto_config.ipynb"
]
@@ -609,7 +609,7 @@
"\n",
" def __call__(self, query, document):\n",
" return jnp.einsum(\n",
- " '...h,...h-\u003e...',\n",
+ " '...h,...h->...',\n",
" self.encode_query(query),\n",
" self.encode_document(document),\n",
" )\n",
@@ -768,7 +768,7 @@
" precision = None\n",
" kernel_init = init\n",
" bias_init = zeros\n",
- " ), \u003cfunction gelu at 0x7faa19d3eef0\u003e, Dense(\n",
+ " ), <function gelu at 0x7faa19d3eef0>, Dense(\n",
" # attributes\n",
" features = 1\n",
" use_bias = True\n",
@@ -776,7 +776,7 @@
" precision = None\n",
" kernel_init = init\n",
" bias_init = zeros\n",
- " ), \u003cfunction softmax at 0x7faa19d3f0e0\u003e]\n",
+ " ), <function softmax at 0x7faa19d3f0e0>]\n",
")\n",
"\n",
"Param shapes:\n",
@@ -859,7 +859,7 @@
"\n",
"You can ask Fiddle to make a graphical visualization for a Fiddle configuration. This can be really helpful when trying to quickly understand an unfamiliar codebase, or to ensure an experiment is doing exactly what you expect.\n",
"\n",
- "\u003e Note: by calling `fiddle.extensions.jax.enable()` you get a prettier visualization, but it is not required."
+ "> Note: by calling `fiddle.extensions.jax.enable()` you get a prettier visualization, but it is not required."
]
},
{
@@ -886,9 +886,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"525pt\" height=\"156pt\"\n viewBox=\"0.00 0.00 525.00 156.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 152)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-152 521,-152 521,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"19.5,-19 19.5,-38 96.5,-38 96.5,-19 19.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"19.5,-19 19.5,-38 96.5,-38 96.5,-19 19.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"23.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"55.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"19.5,0 19.5,-19 78.5,-19 78.5,0 19.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"19.5,0 19.5,-19 78.5,-19 78.5,0 19.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"25.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"78.5,0 78.5,-19 96.5,-19 96.5,0 78.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"82.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e4\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" 
class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"0.5,-129 0.5,-148 517.5,-148 517.5,-129 0.5,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-129 0.5,-148 517.5,-148 517.5,-129 0.5,-129\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"209.5\" y=\"-137\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"241.5\" y=\"-137\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Sequential\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0.5,-74 0.5,-129 45.5,-129 45.5,-74 0.5,-74\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-74 0.5,-129 45.5,-129 45.5,-74 0.5,-74\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4.5\" y=\"-99\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elayers\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"45.5,-74 45.5,-129 517.5,-129 517.5,-74 45.5,-74\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"49.5,-106 49.5,-125 513.5,-125 513.5,-106 49.5,-106\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-106 49.5,-125 513.5,-125 513.5,-106 49.5,-106\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"269\" y=\"-113\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elist\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-87 49.5,-106 65.5,-106 65.5,-87 49.5,-87\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"53.5,-91 53.5,-102 61.5,-102 61.5,-91 53.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"53.5,-91 53.5,-102 61.5,-102 61.5,-91 53.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"65.5,-87 65.5,-106 272.5,-106 272.5,-87 65.5,-87\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"69.5\" y=\"-94\" font-family=\"Courier,monospace\" 
font-size=\"10.00\"\u003e\u0026lt;function gelu at 0x7faa19d3eef0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"272.5,-87 272.5,-106 288.5,-106 288.5,-87 272.5,-87\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"276.5,-91 276.5,-102 284.5,-102 284.5,-91 276.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"276.5,-91 276.5,-102 284.5,-102 284.5,-91 276.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"288.5,-87 288.5,-106 513.5,-106 513.5,-87 288.5,-87\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"292.5\" y=\"-94\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function softmax at 0x7faa19d3f0e0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"49.5,-78 49.5,-87 65.5,-87 65.5,-78 49.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-78 49.5,-87 65.5,-87 65.5,-78 49.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"55.5\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"65.5,-78 65.5,-87 272.5,-87 272.5,-78 65.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"65.5,-78 65.5,-87 272.5,-87 272.5,-78 65.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"167\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"272.5,-78 272.5,-87 288.5,-87 288.5,-78 272.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"272.5,-78 272.5,-87 288.5,-87 288.5,-78 272.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"278.5\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e2\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"288.5,-78 288.5,-87 513.5,-87 513.5,-78 288.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"288.5,-78 288.5,-87 513.5,-87 513.5,-78 288.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"399\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e3\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M57.5,-90.97C57.5,-81.17 57.5,-55.63 57.5,-38.02\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"242.5,-19 242.5,-38 319.5,-38 319.5,-19 242.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"242.5,-19 242.5,-38 319.5,-38 319.5,-19 242.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"246.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"278.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"242.5,0 242.5,-19 301.5,-19 301.5,0 242.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"242.5,0 242.5,-19 301.5,-19 301.5,0 242.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"248.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"301.5,0 301.5,-19 319.5,-19 319.5,0 301.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"305.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" 
stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M280.5,-90.97C280.5,-81.17 280.5,-55.63 280.5,-38.02\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7faa27f8d350\u003e"
+ "<graphviz.dot.Graph at 0x7faa27f8d350>"
]
},
"execution_count": 16,
@@ -933,9 +933,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"541pt\" height=\"156pt\"\n viewBox=\"0.00 0.00 541.00 156.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 152)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-152 537,-152 537,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"19.5,-19 19.5,-38 96.5,-38 96.5,-19 19.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"19.5,-19 19.5,-38 96.5,-38 96.5,-19 19.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"23.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"55.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"19.5,0 19.5,-19 78.5,-19 78.5,0 19.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"19.5,0 19.5,-19 78.5,-19 78.5,0 19.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"25.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"78.5,0 78.5,-19 96.5,-19 96.5,0 78.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"82.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e4\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" 
class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"0.5,-129 0.5,-148 533.5,-148 533.5,-129 0.5,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-129 0.5,-148 533.5,-148 533.5,-129 0.5,-129\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"217.5\" y=\"-137\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"249.5\" y=\"-137\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Sequential\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0.5,-74 0.5,-129 45.5,-129 45.5,-74 0.5,-74\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0.5,-74 0.5,-129 45.5,-129 45.5,-74 0.5,-74\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4.5\" y=\"-99\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elayers\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"45.5,-74 45.5,-129 533.5,-129 533.5,-74 45.5,-74\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"49.5,-106 49.5,-125 529.5,-125 529.5,-106 49.5,-106\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-106 49.5,-125 529.5,-125 529.5,-106 49.5,-106\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"277\" y=\"-113\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elist\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-87 49.5,-106 65.5,-106 65.5,-87 49.5,-87\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"53.5,-91 53.5,-102 61.5,-102 61.5,-91 53.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"53.5,-91 53.5,-102 61.5,-102 61.5,-91 53.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"65.5,-87 65.5,-106 272.5,-106 272.5,-87 65.5,-87\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"69.5\" y=\"-94\" font-family=\"Courier,monospace\" 
font-size=\"10.00\"\u003e\u0026lt;function gelu at 0x7faa19d3eef0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"272.5,-87 272.5,-106 288.5,-106 288.5,-87 272.5,-87\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"276.5,-91 276.5,-102 284.5,-102 284.5,-91 276.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"276.5,-91 276.5,-102 284.5,-102 284.5,-91 276.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"288.5,-87 288.5,-106 513.5,-106 513.5,-87 288.5,-87\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"292.5\" y=\"-94\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function softmax at 0x7faa19d3f0e0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"513.5,-87 513.5,-106 529.5,-106 529.5,-87 513.5,-87\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"517.5,-91 517.5,-102 525.5,-102 525.5,-91 517.5,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"517.5,-91 517.5,-102 525.5,-102 525.5,-91 517.5,-91\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"49.5,-78 49.5,-87 65.5,-87 65.5,-78 49.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"49.5,-78 49.5,-87 65.5,-87 65.5,-78 49.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"55.5\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"65.5,-78 65.5,-87 272.5,-87 272.5,-78 65.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"65.5,-78 65.5,-87 272.5,-87 272.5,-78 65.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"167\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"272.5,-78 272.5,-87 288.5,-87 288.5,-78 272.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"272.5,-78 272.5,-87 288.5,-87 288.5,-78 272.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"278.5\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e2\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"288.5,-78 288.5,-87 513.5,-87 513.5,-78 288.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"288.5,-78 288.5,-87 513.5,-87 513.5,-78 288.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"399\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"513.5,-78 513.5,-87 529.5,-87 529.5,-78 513.5,-78\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"513.5,-78 513.5,-87 529.5,-87 529.5,-78 513.5,-78\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"519.5\" y=\"-81.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e4\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M57.5,-90.97C57.5,-81.17 57.5,-55.63 57.5,-38.02\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"362.5,-19 362.5,-38 439.5,-38 439.5,-19 362.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"362.5,-19 362.5,-38 439.5,-38 439.5,-19 362.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"366.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"398.5\" y=\"-27\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"362.5,0 362.5,-19 
421.5,-19 421.5,0 362.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"362.5,0 362.5,-19 421.5,-19 421.5,0 362.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"368.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"421.5,0 421.5,-19 439.5,-19 439.5,0 421.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"425.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M284.77,-92.33C298.42,-83.8 341.84,-56.66 371.44,-38.16\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M517.47,-92.5C504.02,-84.17 459.8,-56.76 429.75,-38.13\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7fa9fee0bcd0\u003e"
+ "<graphviz.dot.Graph at 0x7fa9fee0bcd0>"
]
},
"execution_count": 17,
@@ -985,9 +985,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"553pt\" height=\"175pt\"\n viewBox=\"0.00 0.00 552.50 175.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 171)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-171 548.5,-171 548.5,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"0,-37.5 0,-56.5 138,-56.5 138,-37.5 0,-37.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-37.5 0,-56.5 138,-56.5 138,-37.5 0,-37.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"34.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"66.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-18.5 0,-37.5 57,-37.5 57,-18.5 0,-18.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-18.5 0,-37.5 57,-37.5 57,-18.5 0,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,-18.5 57,-37.5 138,-37.5 138,-18.5 57,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e4\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,0.5 0,-18.5 57,-18.5 57,0.5 
0,0.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,0.5 0,-18.5 57,-18.5 57,0.5 0,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"22\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,0.5 57,-18.5 138,-18.5 138,0.5 57,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.bfloat16\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"12,-148 12,-167 545,-167 545,-148 12,-148\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"12,-148 12,-167 545,-167 545,-148 12,-148\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"229\" y=\"-156\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"261\" y=\"-156\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Sequential\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"12,-93 12,-148 57,-148 57,-93 12,-93\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"12,-93 12,-148 57,-148 57,-93 12,-93\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"16\" y=\"-118\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elayers\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,-93 57,-148 545,-148 545,-93 57,-93\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"61,-125 61,-144 541,-144 541,-125 61,-125\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"61,-125 61,-144 541,-144 541,-125 61,-125\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"288.5\" y=\"-132\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elist\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"61,-106 
61,-125 77,-125 77,-106 61,-106\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"65,-110 65,-121 73,-121 73,-110 65,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"65,-110 65,-121 73,-121 73,-110 65,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"77,-106 77,-125 284,-125 284,-106 77,-106\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"81\" y=\"-113\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function gelu at 0x7faa19d3eef0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"284,-106 284,-125 300,-125 300,-106 284,-106\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"288,-110 288,-121 296,-121 296,-110 288,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"288,-110 288,-121 296,-121 296,-110 288,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"300,-106 300,-125 525,-125 525,-106 300,-106\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"304\" y=\"-113\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function softmax at 0x7faa19d3f0e0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"525,-106 525,-125 541,-125 541,-106 525,-106\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"529,-110 529,-121 537,-121 537,-110 529,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"529,-110 529,-121 537,-121 537,-110 529,-110\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"61,-97 61,-106 77,-106 77,-97 61,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"61,-97 61,-106 77,-106 77,-97 61,-97\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"67\" y=\"-100.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"77,-97 77,-106 284,-106 284,-97 77,-97\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"77,-97 77,-106 284,-106 284,-97 77,-97\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"178.5\" y=\"-100.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"284,-97 284,-106 300,-106 300,-97 284,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"284,-97 284,-106 300,-106 300,-97 284,-97\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"290\" y=\"-100.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e2\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"300,-97 300,-106 525,-106 525,-97 300,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"300,-97 300,-106 525,-106 525,-97 300,-97\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"410.5\" y=\"-100.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"525,-97 525,-106 541,-106 541,-97 525,-97\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"525,-97 525,-106 541,-106 541,-97 525,-97\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"531\" y=\"-100.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e4\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M69,-109.92C69,-100.5 69,-76.51 69,-57.16\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"344,-37.5 344,-56.5 482,-56.5 482,-37.5 344,-37.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,-37.5 344,-56.5 482,-56.5 482,-37.5 344,-37.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"378.5\" 
y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"410.5\" y=\"-45.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"344,-18.5 344,-37.5 401,-37.5 401,-18.5 344,-18.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,-18.5 344,-37.5 401,-37.5 401,-18.5 344,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"348\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"401,-18.5 401,-37.5 482,-37.5 482,-18.5 401,-18.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"405\" y=\"-25.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"344,0.5 344,-18.5 401,-18.5 401,0.5 344,0.5\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,0.5 344,-18.5 401,-18.5 401,0.5 344,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"366\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"401,0.5 401,-18.5 482,-18.5 482,0.5 401,0.5\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"405\" y=\"-6.5\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.bfloat16\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M296.03,-111.19C308,-102.83 344.36,-77.43 373.4,-57.15\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" 
stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M528.73,-110.99C516.58,-102.44 480.86,-77.28 452.28,-57.16\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7fa9fee3d590\u003e"
+ "<graphviz.dot.Graph at 0x7fa9fee3d590>"
]
},
"execution_count": 18,
@@ -1024,9 +1024,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"550pt\" height=\"194pt\"\n viewBox=\"0.00 0.00 549.50 194.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 190)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-190 545.5,-190 545.5,4 -4,4\"/\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"0,-57 0,-76 132,-76 132,-57 0,-57\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-57 0,-76 132,-76 132,-57 0,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"31.5\" y=\"-65\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"63.5\" y=\"-65\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-38 0,-57 57,-57 57,-38 0,-38\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-38 0,-57 57,-57 57,-38 0,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,-38 57,-57 132,-57 132,-38 57,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e4\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,-19 0,-38 57,-38 57,-19 0,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" 
points=\"0,-19 0,-38 57,-38 57,-19 0,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"22\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,-19 57,-38 132,-38 132,-19 57,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.float32\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"0,0 0,-19 57,-19 57,0 0,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,0 0,-19 57,-19 57,0 0,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003euse_bias\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"57,0 57,-19 132,-19 132,0 57,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"61\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eFalse\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"transparent\" points=\"9,-167 9,-186 542,-186 542,-167 9,-167\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"9,-167 9,-186 542,-186 542,-167 9,-167\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"226\" y=\"-175\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"258\" y=\"-175\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Sequential\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"9,-112 9,-167 54,-167 54,-112 9,-112\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"9,-112 9,-167 54,-167 54,-112 9,-112\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"13\" y=\"-137\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elayers\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" 
points=\"54,-112 54,-167 542,-167 542,-112 54,-112\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"58,-144 58,-163 538,-163 538,-144 58,-144\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"58,-144 58,-163 538,-163 538,-144 58,-144\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"285.5\" y=\"-151\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003elist\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"58,-125 58,-144 74,-144 74,-125 58,-125\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"transparent\" points=\"62,-129 62,-140 70,-140 70,-129 62,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"62,-129 62,-140 70,-140 70,-129 62,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"74,-125 74,-144 281,-144 281,-125 74,-125\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"78\" y=\"-132\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function gelu at 0x7faa19d3eef0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"281,-125 281,-144 297,-144 297,-125 281,-125\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"285,-129 285,-140 293,-140 293,-129 285,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"285,-129 285,-140 293,-140 293,-129 285,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"297,-125 297,-144 522,-144 522,-125 297,-125\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"301\" y=\"-132\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026lt;function softmax at 0x7faa19d3f0e0\u0026gt;\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"522,-125 522,-144 538,-144 538,-125 522,-125\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"526,-129 526,-140 534,-140 534,-129 526,-129\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"526,-129 526,-140 534,-140 534,-129 
526,-129\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"58,-116 58,-125 74,-125 74,-116 58,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"58,-116 58,-125 74,-125 74,-116 58,-116\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"64\" y=\"-119.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"74,-116 74,-125 281,-125 281,-116 74,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"74,-116 74,-125 281,-125 281,-116 74,-116\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"175.5\" y=\"-119.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"281,-116 281,-125 297,-125 297,-116 281,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"281,-116 281,-125 297,-125 297,-116 281,-116\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"287\" y=\"-119.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e2\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"297,-116 297,-125 522,-125 522,-116 297,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"297,-116 297,-125 522,-125 522,-116 297,-116\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"407.5\" y=\"-119.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"522,-116 522,-125 538,-125 538,-116 522,-116\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"522,-116 522,-125 538,-125 538,-116 522,-116\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"528\" y=\"-119.2\" font-family=\"Courier,monospace\" font-size=\"6.00\"\u003e4\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath 
fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M66,-128.96C66,-119.82 66,-96.77 66,-76.29\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"transparent\" points=\"344,-57 344,-76 476,-76 476,-57 344,-57\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,-57 344,-76 476,-76 476,-57 344,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"375.5\" y=\"-65\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"407.5\" y=\"-65\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e Dense\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"344,-38 344,-57 401,-57 401,-38 344,-38\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,-38 344,-57 401,-57 401,-38 344,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"348\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"401,-38 401,-57 476,-57 476,-38 401,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"405\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" points=\"344,-19 344,-38 401,-38 401,-19 344,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,-19 344,-38 401,-38 401,-19 344,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"366\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"401,-19 401,-38 476,-38 476,-19 401,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"405\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.float32\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"transparent\" 
points=\"344,0 344,-19 401,-19 401,0 344,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"344,0 344,-19 401,-19 401,0 344,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"348\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003euse_bias\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"401,0 401,-19 476,-19 476,0 401,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"405\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eFalse\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M293.03,-129.87C303.89,-121.43 334.85,-97.38 362.18,-76.15\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#000000\" stroke-width=\"3\" stroke-opacity=\"0.188235\" d=\"M525.73,-129.65C514.71,-121.02 484.28,-97.19 457.39,-76.13\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.dot.Graph at 0x7fa9fee3dcd0\u003e"
+ "<graphviz.dot.Graph at 0x7fa9fee3dcd0>"
]
},
"execution_count": 19,
@@ -1060,7 +1060,7 @@
"If, when you print out your model, a value is set to an unexpected value, you can easily determine when it got set thanks to the time-travelling debugging infrastructure! `printing.history_per_leaf_parameter` will print out, for each leaf parameter:\n",
"\n",
" 1. the current value,\n",
- " 2. where the current value was set (file (or notebook cell), line number, and function name (or `\u003cmodule\u003e` if set at the top-level) after the `@` sign), and\n",
+ " 2. where the current value was set (file (or notebook cell), line number, and function name (or `<module>` if set at the top-level) after the `@` sign), and\n",
" 3. all previous values (in reverse chronological order) including where they were set.\n",
"\n",
"For additional information, check out the doc-strings for `printing` and each function."
@@ -1089,37 +1089,37 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "layers[0].features = 4 @ \u003cipython-input-14-d5dfc72e0365\u003e:3:\u003cmodule\u003e\n",
- "layers[0].dtype = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
- " - previously: \u003cclass 'jax._src.numpy.lax_numpy.bfloat16'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
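+ "layers[0].features = 4 @ <ipython-input-14-d5dfc72e0365>:3:<module>\n",
+ "layers[0].dtype = <class 'jax._src.numpy.lax_numpy.float32'> @ //fiddle/experimental/selectors.py:107:set\n",
+ " - previously: <class 'jax._src.numpy.lax_numpy.bfloat16'> @ //fiddle/experimental/selectors.py:107:set\n",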
"layers[0].use_bias = False @ //fiddle/experimental/selectors.py:107:set\n",
- "layers[0].bias_init = \u003c[unset]\u003e\n",
- "layers[0].kernel_init = \u003c[unset]\u003e\n",
- "layers[0].name = \u003c[unset]\u003e\n",
- "layers[0].parent = \u003c[unset]\u003e\n",
- "layers[0].precision = \u003c[unset]\u003e\n",
- "layers[1] = \u003cfunction gelu at 0x7faa19d3eef0\u003e\n",
- "layers[2].features = 1 @ \u003cipython-input-14-d5dfc72e0365\u003e:5:\u003cmodule\u003e\n",
- "layers[2].dtype = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
- " - previously: \u003cclass 'jax._src.numpy.lax_numpy.bfloat16'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
+ "layers[0].bias_init = <[unset]>\n",
+ "layers[0].kernel_init = <[unset]>\n",
+ "layers[0].name = <[unset]>\n",
+ "layers[0].parent = <[unset]>\n",
+ "layers[0].precision = <[unset]>\n",
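+ "layers[1] = <function gelu at 0x7faa19d3eef0>\n",
+ "layers[2].features = 1 @ <ipython-input-14-d5dfc72e0365>:5:<module>\n",
+ "layers[2].dtype = <class 'jax._src.numpy.lax_numpy.float32'> @ //fiddle/experimental/selectors.py:107:set\n",
+ " - previously: <class 'jax._src.numpy.lax_numpy.bfloat16'> @ //fiddle/experimental/selectors.py:107:set\n",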
"layers[2].use_bias = False @ //fiddle/experimental/selectors.py:107:set\n",
- "layers[2].bias_init = \u003c[unset]\u003e\n",
- "layers[2].kernel_init = \u003c[unset]\u003e\n",
- "layers[2].name = \u003c[unset]\u003e\n",
- "layers[2].parent = \u003c[unset]\u003e\n",
- "layers[2].precision = \u003c[unset]\u003e\n",
- "layers[3] = \u003cfunction softmax at 0x7faa19d3f0e0\u003e\n",
- "layers[4].features = 1 @ \u003cipython-input-14-d5dfc72e0365\u003e:5:\u003cmodule\u003e\n",
- "layers[4].dtype = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
- " - previously: \u003cclass 'jax._src.numpy.lax_numpy.bfloat16'\u003e @ //fiddle/experimental/selectors.py:107:set\n",
+ "layers[2].bias_init = <[unset]>\n",
+ "layers[2].kernel_init = <[unset]>\n",
+ "layers[2].name = <[unset]>\n",
+ "layers[2].parent = <[unset]>\n",
+ "layers[2].precision = <[unset]>\n",
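+ "layers[3] = <function softmax at 0x7faa19d3f0e0>\n",
+ "layers[4].features = 1 @ <ipython-input-14-d5dfc72e0365>:5:<module>\n",
+ "layers[4].dtype = <class 'jax._src.numpy.lax_numpy.float32'> @ //fiddle/experimental/selectors.py:107:set\n",
+ " - previously: <class 'jax._src.numpy.lax_numpy.bfloat16'> @ //fiddle/experimental/selectors.py:107:set\n",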
"layers[4].use_bias = False @ //fiddle/experimental/selectors.py:107:set\n",
- "layers[4].bias_init = \u003c[unset]\u003e\n",
- "layers[4].kernel_init = \u003c[unset]\u003e\n",
- "layers[4].name = \u003c[unset]\u003e\n",
- "layers[4].parent = \u003c[unset]\u003e\n",
- "layers[4].precision = \u003c[unset]\u003e\n",
- "name = \u003c[unset]\u003e\n",
- "parent = \u003c[unset]\u003e\n"
+ "layers[4].bias_init = <[unset]>\n",
+ "layers[4].kernel_init = <[unset]>\n",
+ "layers[4].name = <[unset]>\n",
+ "layers[4].parent = <[unset]>\n",
+ "layers[4].precision = <[unset]>\n",
+ "name = <[unset]>\n",
+ "parent = <[unset]>\n"
]
}
],
@@ -1137,7 +1137,7 @@
"\n",
"Fiddle configs can be converted into a string that is easily machine-processable by standard unix tools such as `grep` and `diff`. It includes type annotations (if the corresponding classes include them), and also includes all unset parameters and their defaults (if available).\n",
"\n",
- "\u003e Note: this format intentionally flattens out any aliased sub-configurations."
+ "> Note: this format intentionally flattens out any aliased sub-configurations."
]
},
{
@@ -1165,32 +1165,32 @@
"text": [
"layers[0].features: int = 4\n",
"layers[0].use_bias: bool = False\n",
- "layers[0].dtype: typing.Any = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e\n",
- "layers[0].precision: typing.Any = \u003c[unset; default: None]\u003e\n",
- "layers[0].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction variance_scaling.\u003clocals\u003e.init at 0x7faa19fb1b00\u003e]\u003e\n",
- "layers[0].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction zeros at 0x7faa1a590680\u003e]\u003e\n",
- "layers[0].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7faa19fe4d90\u003e]\u003e\n",
- "layers[0].name: str = \u003c[unset; default: None]\u003e\n",
- "layers[1] = \u003cfunction gelu at 0x7faa19d3eef0\u003e\n",
+ "layers[0].dtype: typing.Any = <class 'jax._src.numpy.lax_numpy.float32'>\n",
+ "layers[0].precision: typing.Any = <[unset; default: None]>\n",
+ "layers[0].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function variance_scaling.<locals>.init at 0x7faa19fb1b00>]>\n",
+ "layers[0].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function zeros at 0x7faa1a590680>]>\n",
+ "layers[0].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7faa19fe4d90>]>\n",
+ "layers[0].name: str = <[unset; default: None]>\n",
+ "layers[1] = <function gelu at 0x7faa19d3eef0>\n",
"layers[2].features: int = 1\n",
"layers[2].use_bias: bool = False\n",
- "layers[2].dtype: typing.Any = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e\n",
- "layers[2].precision: typing.Any = \u003c[unset; default: None]\u003e\n",
- "layers[2].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction variance_scaling.\u003clocals\u003e.init at 0x7faa19fb1b00\u003e]\u003e\n",
- "layers[2].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction zeros at 0x7faa1a590680\u003e]\u003e\n",
- "layers[2].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7faa19fe4d90\u003e]\u003e\n",
- "layers[2].name: str = \u003c[unset; default: None]\u003e\n",
- "layers[3] = \u003cfunction softmax at 0x7faa19d3f0e0\u003e\n",
+ "layers[2].dtype: typing.Any = <class 'jax._src.numpy.lax_numpy.float32'>\n",
+ "layers[2].precision: typing.Any = <[unset; default: None]>\n",
+ "layers[2].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function variance_scaling.<locals>.init at 0x7faa19fb1b00>]>\n",
+ "layers[2].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function zeros at 0x7faa1a590680>]>\n",
+ "layers[2].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7faa19fe4d90>]>\n",
+ "layers[2].name: str = <[unset; default: None]>\n",
+ "layers[3] = <function softmax at 0x7faa19d3f0e0>\n",
"layers[4].features: int = 1\n",
"layers[4].use_bias: bool = False\n",
- "layers[4].dtype: typing.Any = \u003cclass 'jax._src.numpy.lax_numpy.float32'\u003e\n",
- "layers[4].precision: typing.Any = \u003c[unset; default: None]\u003e\n",
- "layers[4].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction variance_scaling.\u003clocals\u003e.init at 0x7faa19fb1b00\u003e]\u003e\n",
- "layers[4].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = \u003c[unset; default: \u003cfunction zeros at 0x7faa1a590680\u003e]\u003e\n",
- "layers[4].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7faa19fe4d90\u003e]\u003e\n",
- "layers[4].name: str = \u003c[unset; default: None]\u003e\n",
- "parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7faa19fe4d90\u003e]\u003e\n",
- "name: str = \u003c[unset; default: None]\u003e\n"
+ "layers[4].dtype: typing.Any = <class 'jax._src.numpy.lax_numpy.float32'>\n",
+ "layers[4].precision: typing.Any = <[unset; default: None]>\n",
+ "layers[4].kernel_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function variance_scaling.<locals>.init at 0x7faa19fb1b00>]>\n",
+ "layers[4].bias_init: typing.Callable[[typing.Any, typing.Iterable[int], typing.Any], typing.Any] = <[unset; default: <function zeros at 0x7faa1a590680>]>\n",
+ "layers[4].parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7faa19fe4d90>]>\n",
+ "layers[4].name: str = <[unset; default: None]>\n",
+ "parent: typing.Union[typing.Type[ForwardRef('Module')], typing.Type[ForwardRef('Scope')], typing.Type[ForwardRef('_Sentinel')], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7faa19fe4d90>]>\n",
+ "name: str = <[unset; default: None]>\n"
]
}
],
diff --git a/fiddle/examples/colabs/select_and_tag_apis.ipynb b/fiddle/examples/colabs/select_and_tag_apis.ipynb
index f0cdaefe..ece73647 100644
--- a/fiddle/examples/colabs/select_and_tag_apis.ipynb
+++ b/fiddle/examples/colabs/select_and_tag_apis.ipynb
@@ -492,7 +492,7 @@
" \"The requested data-type for module outputs.\"\n",
"\n",
"\n",
- "def base_config() -\u003e fdl.Config[Sequential]:\n",
+ "def base_config() -> fdl.Config[Sequential]:\n",
" add_range = fdl.Config(AddRange, 0, 4,\n",
" ActivationDType.new(default=jnp.float32))\n",
" add_const = fdl.Config(AddConstant, 1,\n",
@@ -520,7 +520,7 @@
},
"outputs": [],
"source": [
- "def experiment_config() -\u003e fdl.Config[Sequential]:\n",
+ "def experiment_config() -> fdl.Config[Sequential]:\n",
" cfg = base_config()\n",
" selectors.select(cfg, tag=ActivationDType).replace(value=jnp.int32)\n",
" return cfg\n",
@@ -617,7 +617,7 @@
" fdl.build(ActivationDType.new())\n",
"except Exception as e:\n",
" name = e.__class__.__name__\n",
- " display(HTML(f'\u003cspan style=\"color: red\"\u003e{name}: {e}\u003c/span\u003e'))\n",
+ " display(HTML(f'<span style=\"color: red\">{name}: {e}</span>'))\n",
"\n",
"else:\n",
" raise AssertionError(\"Expected an exception to be thrown!\")"
@@ -685,7 +685,7 @@
" \"\"\"DType for final layer neural network computations.\"\"\"\n",
"\n",
"\n",
- "def fine_tag_types_config() -\u003e fdl.Config[Sequential]:\n",
+ "def fine_tag_types_config() -> fdl.Config[Sequential]:\n",
" add_range = fdl.Config(\n",
" AddRange, 0, 4, IntermediateLayerActivationDtype.new(default=jnp.float32))\n",
" add_const = fdl.Config(AddConstant, 1,\n",
@@ -841,9 +841,9 @@
"source": [
"The exception to this is when assigning to subcontainers (e.g., list or dictionary values) and the assignment cannot be detected by Fiddle.\n",
"\n",
- "Second, `select(cfg, tag=\u003ctag\u003e)` checks tags by their class hierarchy; if\n",
+ "Second, `select(cfg, tag=<tag>)` checks tags by their class hierarchy; if\n",
"you redefine a Tag class (e.g. by re-running the cell in colab), and have\n",
- "differing Tag classes in `cfg` and `\u003ctag\u003e` arguments, then you will not set the\n",
+ "differing Tag classes in `cfg` and `<tag>` arguments, then you will not set the\n",
"value of any tags.\n",
"\n",
"Third, by convention, the `TaggedValue` objects are not shared, only `Tag`s.\n",
diff --git a/fiddle/examples/colabs/visualization_printing_codegen.ipynb b/fiddle/examples/colabs/visualization_printing_codegen.ipynb
index 23ee4173..6d7dc9eb 100644
--- a/fiddle/examples/colabs/visualization_printing_codegen.ipynb
+++ b/fiddle/examples/colabs/visualization_printing_codegen.ipynb
@@ -116,7 +116,7 @@
" jnp.float32,\n",
" )\n",
"\n",
- " def __call__(self, inputs: jnp.ndarray) -\u003e jnp.ndarray:\n",
+ " def __call__(self, inputs: jnp.ndarray) -> jnp.ndarray:\n",
" return jnp.asarray(self.embedding[inputs], self.dtype)\n",
"\n",
"\n",
@@ -125,7 +125,7 @@
" output_features: int\n",
"\n",
" @nn.compact\n",
- " def __call__(self, inputs: jnp.ndarray) -\u003e jnp.ndarray:\n",
+ " def __call__(self, inputs: jnp.ndarray) -> jnp.ndarray:\n",
" embedded = self.token_embedder(inputs)\n",
" return nn.Dense(features=self.output_features)(embedded)\n",
"\n",
@@ -136,13 +136,13 @@
"\n",
" def __call__(self, query, document):\n",
" return jnp.einsum(\n",
- " '...h,...h-\u003e...',\n",
+ " '...h,...h->...',\n",
" self.query_encoder(query),\n",
" self.document_encoder(document),\n",
" )\n",
"\n",
"\n",
- "def base_config() -\u003e fdl.Config[DualEncoder]:\n",
+ "def base_config() -> fdl.Config[DualEncoder]:\n",
" shared_token_embedder = fdl.Config(\n",
" TokenEmbedder,\n",
" num_embeddings=12,\n",
@@ -201,9 +201,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"313pt\" height=\"401pt\"\n viewBox=\"0.00 0.00 313.00 401.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 397)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"none\" points=\"-4,4 -4,-397 309,-397 309,4 -4,4\"/\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"162,-76 162,-95 305,-95 305,-76 162,-76\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"162,-76 162,-95 305,-95 305,-76 162,-76\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"166\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"198\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e variance_scaling\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"162,-57 162,-76 245,-76 245,-57 162,-57\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"162,-57 162,-76 245,-76 245,-57 162,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"210\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003escale\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"245,-57 245,-76 305,-76 305,-57 245,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"249\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1.0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"162,-38 162,-57 245,-57 245,-38 162,-38\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"162,-38 162,-57 245,-57 245,-38 162,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"216\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003emode\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"245,-38 245,-57 305,-57 305,-38 245,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"249\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;fan_in\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"162,-19 162,-38 245,-38 245,-19 162,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"162,-19 162,-38 245,-38 245,-19 162,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"168\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edistribution\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"245,-19 245,-38 305,-38 305,-19 245,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"249\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;normal\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"162,0 162,-19 245,-19 245,0 162,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"162,0 162,-19 245,-19 245,0 162,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"192\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eout_axis\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"245,0 245,-19 305,-19 305,0 245,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"249\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"122,-188 122,-207 247,-207 247,-188 122,-188\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"122,-188 122,-207 247,-207 247,-188 
122,-188\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"126\" y=\"-196\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"158\" y=\"-196\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e TokenEmbedder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"122,-169 122,-188 220,-188 220,-169 122,-169\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"122,-169 122,-188 220,-188 220,-169 122,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"131\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enum_embeddings\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"220,-169 220,-188 247,-188 247,-169 220,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"224\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"122,-150 122,-169 220,-169 220,-150 122,-150\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"122,-150 122,-169 220,-169 220,-150 122,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"167\" y=\"-157\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"220,-150 220,-169 247,-169 247,-150 220,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"224\" y=\"-157\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"122,-131 122,-150 220,-150 220,-131 122,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"122,-131 122,-150 220,-150 220,-131 122,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"131\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eembedding_init\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"220,-131 220,-150 247,-150 247,-131 
220,-131\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"224,-135 224,-146 243,-146 243,-135 224,-135\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"224,-135 224,-146 243,-146 243,-135 224,-135\"/\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cb8061\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M233.5,-135.11C233.5,-127.8 233.5,-111.25 233.5,-94.55\"/\u003e\n\u003c/g\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"0,-281 0,-300 125,-300 125,-281 0,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-281 0,-300 125,-300 125,-281 0,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-289\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"36\" y=\"-289\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-262 0,-281 101,-281 101,-262 0,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-262 0,-281 101,-281 101,-262 0,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"12\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-262 101,-281 125,-281 125,-262 101,-262\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"105,-266 105,-277 121,-277 121,-266 105,-266\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105,-266 105,-277 121,-277 121,-266 105,-266\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-243 0,-262 101,-262 101,-243 0,-243\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"0,-243 0,-262 101,-262 101,-243 0,-243\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"6\" y=\"-250\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-243 101,-262 125,-262 125,-243 101,-243\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"105\" y=\"-250\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 1\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e1:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M116.55,-266.18C123.77,-255.96 142.5,-229.46 158.47,-206.85\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"none\" points=\"20,-374 20,-393 141,-393 141,-374 20,-374\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-374 20,-393 141,-393 141,-374 20,-374\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"28\" y=\"-382\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"60\" y=\"-382\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e DualEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-355 20,-374 125,-374 125,-355 20,-355\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-355 20,-374 125,-374 125,-355 20,-355\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"42\" y=\"-362\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003equery_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-355 125,-374 141,-374 141,-355 125,-355\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"129,-359 129,-370 137,-370 137,-359 129,-359\"/\u003e\n\u003cpolygon 
fill=\"none\" stroke=\"black\" points=\"129,-359 129,-370 137,-370 137,-359 129,-359\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-336 20,-355 125,-355 125,-336 20,-336\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-336 20,-355 125,-355 125,-336 20,-336\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"24\" y=\"-343\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edocument_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-336 125,-355 141,-355 141,-336 125,-336\"/\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"none\" points=\"129,-340 129,-351 137,-351 137,-340 129,-340\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"129,-340 129,-351 137,-351 137,-340 129,-340\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#73be73\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M130.08,-359.11C121.82,-348.53 100.28,-320.93 83.72,-299.7\"/\u003e\n\u003c/g\u003e\n\u003c!-- 4 --\u003e\n\u003cg id=\"node5\" class=\"node\"\u003e\n\u003ctitle\u003e4\u003c/title\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"none\" points=\"143,-281 143,-300 268,-300 268,-281 143,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-281 143,-300 268,-300 268,-281 143,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"147\" y=\"-289\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"179\" y=\"-289\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-262 143,-281 244,-281 244,-262 143,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-262 143,-281 244,-281 244,-262 143,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"155\" 
y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-262 244,-281 268,-281 268,-262 244,-262\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"248,-266 248,-277 264,-277 264,-266 248,-266\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"248,-266 248,-277 264,-277 264,-266 248,-266\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-243 143,-262 244,-262 244,-243 143,-243\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-243 143,-262 244,-262 244,-243 143,-243\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"149\" y=\"-250\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-243 244,-262 268,-262 268,-243 244,-243\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"248\" y=\"-250\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;4 --\u003e\n\u003cg id=\"edge5\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;4:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#8aacb7\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M136.97,-341.03C144.39,-333.61 162.38,-315.62 178.06,-299.94\"/\u003e\n\u003c/g\u003e\n\u003c!-- 4\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge4\" class=\"edge\"\u003e\n\u003ctitle\u003e4:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M253.41,-266.18C246.08,-255.96 227.1,-229.46 210.9,-206.85\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.graphs.Graph at 0x7fd244d6aaa0\u003e"
+ "<graphviz.graphs.Graph at 0x7fd244d6aaa0>"
]
},
"execution_count": 3,
@@ -249,9 +249,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"311pt\" height=\"420pt\"\n viewBox=\"0.00 0.00 311.00 420.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 416)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"none\" points=\"-4,4 -4,-416 307,-416 307,4 -4,4\"/\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"160,-76 160,-95 303,-95 303,-76 160,-76\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"160,-76 160,-95 303,-95 303,-76 160,-76\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"164\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"196\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e variance_scaling\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"160,-57 160,-76 243,-76 243,-57 160,-57\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"160,-57 160,-76 243,-76 243,-57 160,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"208\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003escale\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"243,-57 243,-76 303,-76 303,-57 243,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"247\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1.0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"160,-38 160,-57 243,-57 243,-38 160,-38\"/\u003e\n\u003cpolygon fill=\"none\" 
stroke=\"black\" points=\"160,-38 160,-57 243,-57 243,-38 160,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"214\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003emode\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"243,-38 243,-57 303,-57 303,-38 243,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"247\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;fan_in\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"160,-19 160,-38 243,-38 243,-19 160,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"160,-19 160,-38 243,-38 243,-19 160,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"166\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edistribution\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"243,-19 243,-38 303,-38 303,-19 243,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"247\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;normal\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"160,0 160,-19 243,-19 243,0 160,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"160,0 160,-19 243,-19 243,0 160,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"190\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eout_axis\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"243,0 243,-19 303,-19 303,0 243,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"247\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"97.5,-207 97.5,-226 271.5,-226 271.5,-207 97.5,-207\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97.5,-207 97.5,-226 271.5,-226 271.5,-207 
97.5,-207\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"126\" y=\"-215\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"158\" y=\"-215\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e TokenEmbedder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"97.5,-188 97.5,-207 190.5,-207 190.5,-188 97.5,-188\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97.5,-188 97.5,-207 190.5,-207 190.5,-188 97.5,-188\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"101.5\" y=\"-195\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enum_embeddings\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"190.5,-188 190.5,-207 271.5,-207 271.5,-188 190.5,-188\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"194.5\" y=\"-195\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"97.5,-169 97.5,-188 190.5,-188 190.5,-169 97.5,-169\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97.5,-169 97.5,-188 190.5,-188 190.5,-169 97.5,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"137.5\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"190.5,-169 190.5,-188 271.5,-188 271.5,-169 190.5,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"194.5\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"97.5,-150 97.5,-169 190.5,-169 190.5,-150 97.5,-150\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97.5,-150 97.5,-169 190.5,-169 190.5,-150 97.5,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"101.5\" y=\"-157\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eembedding_init\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" 
points=\"190.5,-150 190.5,-169 271.5,-169 271.5,-150 190.5,-150\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"194.5,-154 194.5,-165 267.5,-165 267.5,-154 194.5,-154\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"194.5,-154 194.5,-165 267.5,-165 267.5,-154 194.5,-154\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"97.5,-131 97.5,-150 190.5,-150 190.5,-131 97.5,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"97.5,-131 97.5,-150 190.5,-150 190.5,-131 97.5,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"155.5\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"190.5,-131 190.5,-150 271.5,-150 271.5,-131 190.5,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"194.5\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.bfloat16\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cb8061\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M231.5,-154.05C231.5,-143.96 231.5,-118.4 231.5,-94.96\"/\u003e\n\u003c/g\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"0,-300 0,-319 125,-319 125,-300 0,-300\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-300 0,-319 125,-319 125,-300 0,-300\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"36\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-281 0,-300 101,-300 101,-281 
0,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-281 0,-300 101,-300 101,-281 0,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"12\" y=\"-288\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-281 101,-300 125,-300 125,-281 101,-281\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"105,-285 105,-296 121,-296 121,-285 105,-285\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105,-285 105,-296 121,-296 121,-285 105,-285\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-262 0,-281 101,-281 101,-262 0,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-262 0,-281 101,-281 101,-262 0,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"6\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-262 101,-281 125,-281 125,-262 101,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"105\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 1\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e1:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M116.37,-285.05C122.88,-274.96 139.38,-249.4 154.51,-225.96\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"none\" points=\"20,-393 20,-412 141,-412 141,-393 20,-393\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-393 20,-412 141,-412 141,-393 20,-393\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"28\" y=\"-401\" font-family=\"Courier,monospace\" 
font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"60\" y=\"-401\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e DualEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-374 20,-393 125,-393 125,-374 20,-374\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-374 20,-393 125,-393 125,-374 20,-374\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"42\" y=\"-381\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003equery_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-374 125,-393 141,-393 141,-374 125,-374\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"129,-378 129,-389 137,-389 137,-378 129,-378\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"129,-378 129,-389 137,-389 137,-378 129,-378\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-355 20,-374 125,-374 125,-355 20,-355\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-355 20,-374 125,-374 125,-355 20,-355\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"24\" y=\"-362\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edocument_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-355 125,-374 141,-374 141,-355 125,-355\"/\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"none\" points=\"129,-359 129,-370 137,-370 137,-359 129,-359\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"129,-359 129,-370 137,-370 137,-359 129,-359\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#73be73\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M130.08,-378.11C121.82,-367.53 100.28,-339.93 83.72,-318.7\"/\u003e\n\u003c/g\u003e\n\u003c!-- 4 --\u003e\n\u003cg id=\"node5\" 
class=\"node\"\u003e\n\u003ctitle\u003e4\u003c/title\u003e\n\u003cpolygon fill=\"#add8e6\" stroke=\"none\" points=\"143,-300 143,-319 268,-319 268,-300 143,-300\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-300 143,-319 268,-319 268,-300 143,-300\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"147\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"179\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-281 143,-300 244,-300 244,-281 143,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-281 143,-300 244,-300 244,-281 143,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"155\" y=\"-288\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-281 244,-300 268,-300 268,-281 244,-281\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"248,-285 248,-296 264,-296 264,-285 248,-285\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"248,-285 248,-296 264,-296 264,-285 248,-285\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-262 143,-281 244,-281 244,-262 143,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-262 143,-281 244,-281 244,-262 143,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"149\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-262 244,-281 268,-281 268,-262 244,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"248\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;4 --\u003e\n\u003cg id=\"edge5\" 
class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;4:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#8aacb7\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M136.97,-360.03C144.39,-352.61 162.38,-334.62 178.06,-318.94\"/\u003e\n\u003c/g\u003e\n\u003c!-- 4\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge4\" class=\"edge\"\u003e\n\u003ctitle\u003e4:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M253.59,-285.05C246.98,-274.96 230.25,-249.4 214.91,-225.96\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.graphs.Graph at 0x7fd244d69720\u003e"
+ "<graphviz.graphs.Graph at 0x7fd244d69720>"
]
},
"execution_count": 4,
@@ -272,7 +272,7 @@
},
"source": [
"You'll notice that this is nicely rendered as `jnp.bfloat16` instead of its\n",
- "`repr()` string, `\u003cclass 'jax._src.numpy.lax_numpy.bfloat16'\u003e`; this is because\n",
+ "`repr()` string, `<class 'jax._src.numpy.lax_numpy.bfloat16'>`; this is because\n",
"we called `fiddle.extensions.jax.enable()` in the beginning of this colab.\n",
"However, these JAX extensions are not necessary for graphviz to work."
]
@@ -313,9 +313,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"324pt\" height=\"420pt\"\n viewBox=\"0.00 0.00 323.50 420.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 416)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"none\" points=\"-4,4 -4,-416 319.5,-416 319.5,4 -4,4\"/\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"172.5,-76 172.5,-95 315.5,-95 315.5,-76 172.5,-76\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"172.5,-76 172.5,-95 315.5,-95 315.5,-76 172.5,-76\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"176.5\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"208.5\" y=\"-84\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e variance_scaling\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"172.5,-57 172.5,-76 255.5,-76 255.5,-57 172.5,-57\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"172.5,-57 172.5,-76 255.5,-76 255.5,-57 172.5,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"220.5\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003escale\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"255.5,-57 255.5,-76 315.5,-76 315.5,-57 255.5,-57\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"259.5\" y=\"-64\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e1.0\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"172.5,-38 172.5,-57 
255.5,-57 255.5,-38 172.5,-38\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"172.5,-38 172.5,-57 255.5,-57 255.5,-38 172.5,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"226.5\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003emode\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"255.5,-38 255.5,-57 315.5,-57 315.5,-38 255.5,-38\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"259.5\" y=\"-45\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;fan_in\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"172.5,-19 172.5,-38 255.5,-38 255.5,-19 172.5,-19\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"172.5,-19 172.5,-38 255.5,-38 255.5,-19 172.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"178.5\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edistribution\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"255.5,-19 255.5,-38 315.5,-38 315.5,-19 255.5,-19\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"259.5\" y=\"-26\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e\u0026#39;normal\u0026#39;\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"172.5,0 172.5,-19 255.5,-19 255.5,0 172.5,0\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"172.5,0 172.5,-19 255.5,-19 255.5,0 172.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"202.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eout_axis\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"255.5,0 255.5,-19 315.5,-19 315.5,0 255.5,0\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"259.5\" y=\"-7\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e0\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"110,-207 
110,-226 284,-226 284,-207 110,-207\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"110,-207 110,-226 284,-226 284,-207 110,-207\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"138.5\" y=\"-215\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"170.5\" y=\"-215\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e TokenEmbedder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"110,-188 110,-207 203,-207 203,-188 110,-188\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"110,-188 110,-207 203,-207 203,-188 110,-188\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"114\" y=\"-195\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003enum_embeddings\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"203,-188 203,-207 284,-207 284,-188 203,-188\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"207\" y=\"-195\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"110,-169 110,-188 203,-188 203,-169 110,-169\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"110,-169 110,-188 203,-188 203,-169 110,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"150\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003efeatures\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"203,-169 203,-188 284,-188 284,-169 203,-169\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"207\" y=\"-176\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e3\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"110,-150 110,-169 203,-169 203,-150 110,-150\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"110,-150 110,-169 203,-169 203,-150 110,-150\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"114\" y=\"-157\" font-family=\"Courier,monospace\" 
font-size=\"10.00\"\u003eembedding_init\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"203,-150 203,-169 284,-169 284,-150 203,-150\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"207,-154 207,-165 280,-165 280,-154 207,-154\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"207,-154 207,-165 280,-165 280,-154 207,-154\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"110,-131 110,-150 203,-150 203,-131 110,-131\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"110,-131 110,-150 203,-150 203,-131 110,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"168\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edtype\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"203,-131 203,-150 284,-150 284,-131 203,-131\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"207\" y=\"-138\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003ejnp.bfloat16\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 2\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e2:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cb8061\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M244,-154.05C244,-143.96 244,-118.4 244,-94.96\"/\u003e\n\u003c/g\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"83.5,-300 83.5,-319 208.5,-319 208.5,-300 83.5,-300\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"83.5,-300 83.5,-319 208.5,-319 208.5,-300 83.5,-300\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"87.5\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"119.5\" y=\"-308\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" 
stroke=\"none\" points=\"83.5,-281 83.5,-300 184.5,-300 184.5,-281 83.5,-281\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"83.5,-281 83.5,-300 184.5,-300 184.5,-281 83.5,-281\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"95.5\" y=\"-288\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"184.5,-281 184.5,-300 208.5,-300 208.5,-281 184.5,-281\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"188.5,-285 188.5,-296 204.5,-296 204.5,-285 188.5,-285\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"188.5,-285 188.5,-296 204.5,-296 204.5,-285 188.5,-285\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"83.5,-262 83.5,-281 184.5,-281 184.5,-262 83.5,-262\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"83.5,-262 83.5,-281 184.5,-281 184.5,-262 83.5,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"89.5\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"184.5,-262 184.5,-281 208.5,-281 208.5,-262 184.5,-262\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"188.5\" y=\"-269\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 1\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e1:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M197,-285.05C197,-274.96 197,-249.4 197,-225.96\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"none\" points=\"0,-393 0,-412 186,-412 186,-393 0,-393\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-393 0,-412 186,-412 186,-393 
0,-393\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"40.5\" y=\"-401\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"72.5\" y=\"-401\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e DualEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-374 0,-393 105,-393 105,-374 0,-374\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-374 0,-393 105,-393 105,-374 0,-374\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"22\" y=\"-381\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003equery_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105,-374 105,-393 186,-393 186,-374 105,-374\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"109,-378 109,-389 182,-389 182,-378 109,-378\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"109,-378 109,-389 182,-389 182,-378 109,-378\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-355 0,-374 105,-374 105,-355 0,-355\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-355 0,-374 105,-374 105,-355 0,-355\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-362\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edocument_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105,-355 105,-374 186,-374 186,-355 105,-355\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"109\" y=\"-363\" font-family=\"Courier,monospace\" font-style=\"italic\" font-size=\"10.00\"\u003e(trimmed...)\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#73be73\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M146,-378.11C146,-367.53 146,-339.93 146,-318.7\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.graphs.Graph at 0x7fd244d68850\u003e"
+ "<graphviz.graphs.Graph at 0x7fd244d68850>"
]
},
"execution_count": 5,
@@ -362,9 +362,9 @@
"outputs": [
{
"data": {
- "image/svg+xml": "\u003c?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?\u003e\n\u003c!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\"\u003e\n\u003c!-- Generated by graphviz version 2.44.1 (20201121.0304)\n --\u003e\n\u003c!-- Pages: 1 --\u003e\n\u003csvg width=\"276pt\" height=\"230pt\"\n viewBox=\"0.00 0.00 276.00 230.00\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\"\u003e\n\u003cg id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 226)\"\u003e\n\u003cpolygon fill=\"white\" stroke=\"none\" points=\"-4,4 -4,-226 272,-226 272,4 -4,4\"/\u003e\n\u003c!-- 2 --\u003e\n\u003cg id=\"node1\" class=\"node\"\u003e\n\u003ctitle\u003e2\u003c/title\u003e\n\u003ctext text-anchor=\"start\" x=\"148\" y=\"-16.5\" font-family=\"Courier,monospace\" font-style=\"italic\" font-size=\"10.00\"\u003e(trimmed...)\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 1 --\u003e\n\u003cg id=\"node2\" class=\"node\"\u003e\n\u003ctitle\u003e1\u003c/title\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"0,-110 0,-129 125,-129 125,-110 0,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-110 0,-129 125,-129 125,-110 0,-110\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"4\" y=\"-118\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"36\" y=\"-118\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-91 0,-110 101,-110 101,-91 0,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-91 0,-110 101,-110 101,-91 0,-91\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"12\" y=\"-98\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-91 101,-110 125,-110 125,-91 
101,-91\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"105,-95 105,-106 121,-106 121,-95 105,-95\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"105,-95 105,-106 121,-106 121,-95 105,-95\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"0,-72 0,-91 101,-91 101,-72 0,-72\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"0,-72 0,-91 101,-91 101,-72 0,-72\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"6\" y=\"-79\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"101,-72 101,-91 125,-91 125,-72 101,-72\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"105\" y=\"-79\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 1\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge1\" class=\"edge\"\u003e\n\u003ctitle\u003e1:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M116.64,-95.1C120.63,-89.58 127.81,-79.87 134.5,-72 145.15,-59.47 157.87,-46 167.82,-35.77\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0 --\u003e\n\u003cg id=\"node3\" class=\"node\"\u003e\n\u003ctitle\u003e0\u003c/title\u003e\n\u003cpolygon fill=\"#ffc0cb\" stroke=\"none\" points=\"20,-203 20,-222 141,-222 141,-203 20,-203\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-203 20,-222 141,-222 141,-203 20,-203\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"28\" y=\"-211\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext text-anchor=\"start\" x=\"60\" y=\"-211\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e DualEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-184 20,-203 125,-203 125,-184 20,-184\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-184 20,-203 125,-203 125,-184 
20,-184\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"42\" y=\"-191\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003equery_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-184 125,-203 141,-203 141,-184 125,-184\"/\u003e\n\u003cpolygon fill=\"#90ee90\" stroke=\"none\" points=\"129,-188 129,-199 137,-199 137,-188 129,-188\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"129,-188 129,-199 137,-199 137,-188 129,-188\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"20,-165 20,-184 125,-184 125,-165 20,-165\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"20,-165 20,-184 125,-184 125,-165 20,-165\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"24\" y=\"-172\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003edocument_encoder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"125,-165 125,-184 141,-184 141,-165 125,-165\"/\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"129,-169 129,-180 137,-180 137,-169 129,-169\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"129,-169 129,-180 137,-180 137,-169 129,-169\"/\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;1 --\u003e\n\u003cg id=\"edge2\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;1:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#73be73\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M130.08,-188.11C121.82,-177.53 100.28,-149.93 83.72,-128.7\"/\u003e\n\u003c/g\u003e\n\u003c!-- 3 --\u003e\n\u003cg id=\"node4\" class=\"node\"\u003e\n\u003ctitle\u003e3\u003c/title\u003e\n\u003cpolygon fill=\"#ffa07a\" stroke=\"none\" points=\"143,-110 143,-129 268,-129 268,-110 143,-110\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-110 143,-129 268,-129 268,-110 143,-110\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"147\" y=\"-118\" font-family=\"Courier,monospace\" font-size=\"8.00\"\u003eConfig:\u003c/text\u003e\n\u003ctext 
text-anchor=\"start\" x=\"179\" y=\"-118\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e SimpleEncoder\u003c/text\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-91 143,-110 244,-110 244,-91 143,-91\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-91 143,-110 244,-110 244,-91 143,-91\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"155\" y=\"-98\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003etoken_embedder\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-91 244,-110 268,-110 268,-91 244,-91\"/\u003e\n\u003cpolygon fill=\"#fff8dc\" stroke=\"none\" points=\"248,-95 248,-106 264,-106 264,-95 248,-95\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"248,-95 248,-106 264,-106 264,-95 248,-95\"/\u003e\n\u003cpolygon fill=\"#eeeeee\" stroke=\"none\" points=\"143,-72 143,-91 244,-91 244,-72 143,-72\"/\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"143,-72 143,-91 244,-91 244,-72 143,-72\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"149\" y=\"-79\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003eoutput_features\u003c/text\u003e\n\u003cpolygon fill=\"none\" stroke=\"black\" points=\"244,-72 244,-91 268,-91 268,-72 244,-72\"/\u003e\n\u003ctext text-anchor=\"start\" x=\"248\" y=\"-79\" font-family=\"Courier,monospace\" font-size=\"10.00\"\u003e12\u003c/text\u003e\n\u003c/g\u003e\n\u003c!-- 0\u0026#45;\u0026#45;3 --\u003e\n\u003cg id=\"edge4\" class=\"edge\"\u003e\n\u003ctitle\u003e0:c\u0026#45;\u0026#45;3:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cb8061\" stroke-width=\"3\" stroke-opacity=\"0.501961\" d=\"M136.97,-170.03C144.39,-162.61 162.38,-144.62 178.06,-128.94\"/\u003e\n\u003c/g\u003e\n\u003c!-- 3\u0026#45;\u0026#45;2 --\u003e\n\u003cg id=\"edge3\" class=\"edge\"\u003e\n\u003ctitle\u003e3:c\u0026#45;\u0026#45;2:c\u003c/title\u003e\n\u003cpath fill=\"none\" stroke=\"#cbc6b0\" stroke-width=\"3\" stroke-opacity=\"0.501961\" 
d=\"M252.63,-95.17C242.81,-84.2 216.54,-54.82 199.64,-35.92\"/\u003e\n\u003c/g\u003e\n\u003c/g\u003e\n\u003c/svg\u003e\n",
+ "image/svg+xml": "\n\n\n\n\n",
"text/plain": [
- "\u003cgraphviz.graphs.Graph at 0x7fd244d684c0\u003e"
+ "<graphviz.graphs.Graph at 0x7fd244d684c0>"
]
},
"execution_count": 6,
@@ -415,7 +415,7 @@
"//# sourceURL=js_160fff874c"
],
"text/plain": [
- "\u003cIPython.core.display.Javascript object\u003e"
+ "<IPython.core.display.Javascript object>"
]
},
"metadata": {},
@@ -425,27 +425,27 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "\u003cConfig[DualEncoder(\n",
- " query_encoder=\u003cConfig[SimpleEncoder(\n",
- " token_embedder=\u003cConfig[TokenEmbedder(\n",
+ ")]>,\n",
+ " output_features=12)]>,\n",
+ " document_encoder=)]>,\n",
+ " output_features=12)]>)]>\n"
]
}
],
@@ -493,33 +493,33 @@
"query_encoder.token_embedder.embedding_init.scale: typing.Any = 1.0\n",
"query_encoder.token_embedder.embedding_init.mode: typing.Union[typing.Literal['fan_in'], typing.Literal['fan_out'], typing.Literal['fan_avg']] = 'fan_in'\n",
"query_encoder.token_embedder.embedding_init.distribution: typing.Union[typing.Literal['truncated_normal'], typing.Literal['normal'], typing.Literal['uniform']] = 'normal'\n",
- "query_encoder.token_embedder.embedding_init.in_axis: typing.Union[int, typing.Sequence[int]] = \u003c[unset; default: -2]\u003e\n",
+ "query_encoder.token_embedder.embedding_init.in_axis: typing.Union[int, typing.Sequence[int]] = <[unset; default: -2]>\n",
"query_encoder.token_embedder.embedding_init.out_axis: typing.Union[int, typing.Sequence[int]] = 0\n",
- "query_encoder.token_embedder.embedding_init.batch_axis: typing.Sequence[int] = \u003c[unset; default: ()]\u003e\n",
- "query_encoder.token_embedder.embedding_init.dtype: typing.Any = \u003c[unset; default: jnp.float64]\u003e\n",
- "query_encoder.token_embedder.dtype: typing.Any = \u003c[unset; default: jnp.float32]\u003e\n",
- "query_encoder.token_embedder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7fd244d616f0\u003e]\u003e\n",
- "query_encoder.token_embedder.name: typing.Optional[str] = \u003c[unset; default: None]\u003e\n",
+ "query_encoder.token_embedder.embedding_init.batch_axis: typing.Sequence[int] = <[unset; default: ()]>\n",
+ "query_encoder.token_embedder.embedding_init.dtype: typing.Any = <[unset; default: jnp.float64]>\n",
+ "query_encoder.token_embedder.dtype: typing.Any = <[unset; default: jnp.float32]>\n",
+ "query_encoder.token_embedder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7fd244d616f0>]>\n",
+ "query_encoder.token_embedder.name: typing.Optional[str] = <[unset; default: None]>\n",
"query_encoder.output_features: int = 12\n",
- "query_encoder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7fd244d616f0\u003e]\u003e\n",
- "query_encoder.name: typing.Optional[str] = \u003c[unset; default: None]\u003e\n",
+ "query_encoder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7fd244d616f0>]>\n",
+ "query_encoder.name: typing.Optional[str] = <[unset; default: None]>\n",
"document_encoder.token_embedder.num_embeddings: int = 12\n",
"document_encoder.token_embedder.features: int = 3\n",
"document_encoder.token_embedder.embedding_init.scale: typing.Any = 1.0\n",
"document_encoder.token_embedder.embedding_init.mode: typing.Union[typing.Literal['fan_in'], typing.Literal['fan_out'], typing.Literal['fan_avg']] = 'fan_in'\n",
"document_encoder.token_embedder.embedding_init.distribution: typing.Union[typing.Literal['truncated_normal'], typing.Literal['normal'], typing.Literal['uniform']] = 'normal'\n",
- "document_encoder.token_embedder.embedding_init.in_axis: typing.Union[int, typing.Sequence[int]] = \u003c[unset; default: -2]\u003e\n",
+ "document_encoder.token_embedder.embedding_init.in_axis: typing.Union[int, typing.Sequence[int]] = <[unset; default: -2]>\n",
"document_encoder.token_embedder.embedding_init.out_axis: typing.Union[int, typing.Sequence[int]] = 0\n",
- "document_encoder.token_embedder.embedding_init.batch_axis: typing.Sequence[int] = \u003c[unset; default: ()]\u003e\n",
- "document_encoder.token_embedder.embedding_init.dtype: typing.Any = \u003c[unset; default: jnp.float64]\u003e\n",
- "document_encoder.token_embedder.dtype: typing.Any = \u003c[unset; default: jnp.float32]\u003e\n",
- "document_encoder.token_embedder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7fd244d616f0\u003e]\u003e\n",
- "document_encoder.token_embedder.name: typing.Optional[str] = \u003c[unset; default: None]\u003e\n",
+ "document_encoder.token_embedder.embedding_init.batch_axis: typing.Sequence[int] = <[unset; default: ()]>\n",
+ "document_encoder.token_embedder.embedding_init.dtype: typing.Any = <[unset; default: jnp.float64]>\n",
+ "document_encoder.token_embedder.dtype: typing.Any = <[unset; default: jnp.float32]>\n",
+ "document_encoder.token_embedder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7fd244d616f0>]>\n",
+ "document_encoder.token_embedder.name: typing.Optional[str] = <[unset; default: None]>\n",
"document_encoder.output_features: int = 12\n",
- "document_encoder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7fd244d616f0\u003e]\u003e\n",
- "document_encoder.name: typing.Optional[str] = \u003c[unset; default: None]\u003e\n",
- "parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = \u003c[unset; default: \u003cflax.linen.module._Sentinel object at 0x7fd244d616f0\u003e]\u003e\n",
- "name: typing.Optional[str] = \u003c[unset; default: None]\u003e\n"
+ "document_encoder.parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7fd244d616f0>]>\n",
+ "document_encoder.name: typing.Optional[str] = <[unset; default: None]>\n",
+ "parent: typing.Union[typing.Type[flax.linen.module.Module], typing.Type[flax.core.scope.Scope], typing.Type[flax.linen.module._Sentinel], NoneType] = <[unset; default: <flax.linen.module._Sentinel object at 0x7fd244d616f0>]>\n",
+ "name: typing.Optional[str] = <[unset; default: None]>\n"
]
}
],
@@ -566,47 +566,47 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "__fn_or_cls__ = \u003cclass '__main__.DualEncoder'\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:56:base_config\n",
- "query_encoder.__fn_or_cls__ = \u003cclass '__main__.SimpleEncoder'\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:58:base_config\n",
- "query_encoder.token_embedder.__fn_or_cls__ = \u003cclass '__main__.TokenEmbedder'\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "query_encoder.token_embedder.num_embeddings = 40 @ \u003cipython-input-9-1e867d8d9c8e\u003e:3:experiment_config\n",
- " - previously: 12 @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "query_encoder.token_embedder.features = 3 @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "query_encoder.token_embedder.embedding_init.__fn_or_cls__ = \u003cfunction variance_scaling at 0x7fd277681cf0\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "query_encoder.token_embedder.embedding_init.scale = 1.0 @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "query_encoder.token_embedder.embedding_init.mode = 'fan_in' @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "query_encoder.token_embedder.embedding_init.distribution = 'normal' @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "query_encoder.token_embedder.embedding_init.out_axis = 0 @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "query_encoder.token_embedder.embedding_init.batch_axis = \u003c[unset]\u003e\n",
- "query_encoder.token_embedder.embedding_init.dtype = \u003c[unset]\u003e\n",
- "query_encoder.token_embedder.embedding_init.in_axis = \u003c[unset]\u003e\n",
- "query_encoder.token_embedder.dtype = \u003c[unset]\u003e\n",
- "query_encoder.token_embedder.name = \u003c[unset]\u003e\n",
- "query_encoder.token_embedder.parent = \u003c[unset]\u003e\n",
- "query_encoder.output_features = 12 @ \u003cipython-input-2-1c737bdff90c\u003e:58:base_config\n",
- "query_encoder.name = \u003c[unset]\u003e\n",
- "query_encoder.parent = \u003c[unset]\u003e\n",
- "document_encoder.__fn_or_cls__ = \u003cclass '__main__.SimpleEncoder'\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:59:base_config\n",
- "document_encoder.token_embedder.__fn_or_cls__ = \u003cclass '__main__.TokenEmbedder'\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "document_encoder.token_embedder.num_embeddings = 40 @ \u003cipython-input-9-1e867d8d9c8e\u003e:3:experiment_config\n",
- " - previously: 12 @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "document_encoder.token_embedder.features = 3 @ \u003cipython-input-2-1c737bdff90c\u003e:49:base_config\n",
- "document_encoder.token_embedder.embedding_init.__fn_or_cls__ = \u003cfunction variance_scaling at 0x7fd277681cf0\u003e @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "document_encoder.token_embedder.embedding_init.scale = 1.0 @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "document_encoder.token_embedder.embedding_init.mode = 'fan_in' @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "document_encoder.token_embedder.embedding_init.distribution = 'normal' @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "document_encoder.token_embedder.embedding_init.out_axis = 0 @ \u003cipython-input-2-1c737bdff90c\u003e:53:base_config\n",
- "document_encoder.token_embedder.embedding_init.batch_axis = \u003c[unset]\u003e\n",
- "document_encoder.token_embedder.embedding_init.dtype = \u003c[unset]\u003e\n",
- "document_encoder.token_embedder.embedding_init.in_axis = \u003c[unset]\u003e\n",
- "document_encoder.token_embedder.dtype = \u003c[unset]\u003e\n",
- "document_encoder.token_embedder.name = \u003c[unset]\u003e\n",
- "document_encoder.token_embedder.parent = \u003c[unset]\u003e\n",
- "document_encoder.output_features = 12 @ \u003cipython-input-2-1c737bdff90c\u003e:59:base_config\n",
- "document_encoder.name = \u003c[unset]\u003e\n",
- "document_encoder.parent = \u003c[unset]\u003e\n",
- "name = \u003c[unset]\u003e\n",
- "parent = \u003c[unset]\u003e\n"
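+ "__fn_or_cls__ = <class '__main__.DualEncoder'> @ <ipython-input-2-1c737bdff90c>:56:base_config\n",
+ "query_encoder.__fn_or_cls__ = <class '__main__.SimpleEncoder'> @ <ipython-input-2-1c737bdff90c>:58:base_config\n",
+ "query_encoder.token_embedder.__fn_or_cls__ = <class '__main__.TokenEmbedder'> @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "query_encoder.token_embedder.num_embeddings = 40 @ <ipython-input-9-1e867d8d9c8e>:3:experiment_config\n",
+ " - previously: 12 @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "query_encoder.token_embedder.features = 3 @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "query_encoder.token_embedder.embedding_init.__fn_or_cls__ = <function variance_scaling at 0x7fd277681cf0> @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "query_encoder.token_embedder.embedding_init.scale = 1.0 @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "query_encoder.token_embedder.embedding_init.mode = 'fan_in' @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "query_encoder.token_embedder.embedding_init.distribution = 'normal' @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "query_encoder.token_embedder.embedding_init.out_axis = 0 @ <ipython-input-2-1c737bdff90c>:53:base_config\n",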
+ "query_encoder.token_embedder.embedding_init.batch_axis = <[unset]>\n",
+ "query_encoder.token_embedder.embedding_init.dtype = <[unset]>\n",
+ "query_encoder.token_embedder.embedding_init.in_axis = <[unset]>\n",
+ "query_encoder.token_embedder.dtype = <[unset]>\n",
+ "query_encoder.token_embedder.name = <[unset]>\n",
+ "query_encoder.token_embedder.parent = <[unset]>\n",
+ "query_encoder.output_features = 12 @ <ipython-input-2-1c737bdff90c>:58:base_config\n",
+ "query_encoder.name = <[unset]>\n",
+ "query_encoder.parent = <[unset]>\n",
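+ "document_encoder.__fn_or_cls__ = <class '__main__.SimpleEncoder'> @ <ipython-input-2-1c737bdff90c>:59:base_config\n",
+ "document_encoder.token_embedder.__fn_or_cls__ = <class '__main__.TokenEmbedder'> @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "document_encoder.token_embedder.num_embeddings = 40 @ <ipython-input-9-1e867d8d9c8e>:3:experiment_config\n",
+ " - previously: 12 @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "document_encoder.token_embedder.features = 3 @ <ipython-input-2-1c737bdff90c>:49:base_config\n",
+ "document_encoder.token_embedder.embedding_init.__fn_or_cls__ = <function variance_scaling at 0x7fd277681cf0> @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "document_encoder.token_embedder.embedding_init.scale = 1.0 @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "document_encoder.token_embedder.embedding_init.mode = 'fan_in' @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "document_encoder.token_embedder.embedding_init.distribution = 'normal' @ <ipython-input-2-1c737bdff90c>:53:base_config\n",
+ "document_encoder.token_embedder.embedding_init.out_axis = 0 @ <ipython-input-2-1c737bdff90c>:53:base_config\n",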
+ "document_encoder.token_embedder.embedding_init.batch_axis = <[unset]>\n",
+ "document_encoder.token_embedder.embedding_init.dtype = <[unset]>\n",
+ "document_encoder.token_embedder.embedding_init.in_axis = <[unset]>\n",
+ "document_encoder.token_embedder.dtype = <[unset]>\n",
+ "document_encoder.token_embedder.name = <[unset]>\n",
+ "document_encoder.token_embedder.parent = <[unset]>\n",
+ "document_encoder.output_features = 12 @ <ipython-input-2-1c737bdff90c>:59:base_config\n",
+ "document_encoder.name = <[unset]>\n",
+ "document_encoder.parent = <[unset]>\n",
+ "name = <[unset]>\n",
+ "parent = <[unset]>\n"
]
}
],