<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!-- blob: f015c0bd4aa055902eca6184249786f2b957c6a5 [file] [log] [blame] -->
<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
<!-- Generated by graphviz version 2.43.0 (0)
-->
<!-- Title: %3 Pages: 1 -->
<svg width="1718pt" height="1916pt"
viewBox="0.00 0.00 1717.50 1916.00" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 1912)">
<title>Operator dataflow graph: input and attention_mask to Function</title>
<polygon fill="white" stroke="none" points="-4,4 -4,-1912 1713.5,-1912 1713.5,4 -4,4"/>
<!-- 0 -->
<g id="node1" class="node">
<title>0</title>
<ellipse fill="none" stroke="black" cx="947.5" cy="-1746" rx="170.87" ry="18"/>
<text text-anchor="middle" x="947.5" y="-1742.3" font-family="Times,serif" font-size="14.00">input: Tensor[(1, 14, 768), float32]</text>
</g>
<!-- 10 -->
<g id="node3" class="node">
<title>10</title>
<polygon fill="none" stroke="black" points="1089.5,-1692 737.5,-1692 737.5,-1656 1089.5,-1656 1089.5,-1692"/>
<text text-anchor="middle" x="913.5" y="-1670.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 14, 768], reverse=0)</text>
</g>
<!-- 0&#45;&gt;10 -->
<g id="edge1" class="edge">
<title>0&#45;&gt;10</title>
<path fill="none" stroke="black" d="M939.1,-1727.7C935.23,-1719.73 930.55,-1710.1 926.26,-1701.26"/>
<polygon fill="black" stroke="black" points="929.33,-1699.57 921.81,-1692.1 923.03,-1702.63 929.33,-1699.57"/>
</g>
<!-- 1 -->
<g id="node2" class="node">
<title>1</title>
<ellipse fill="none" stroke="black" cx="1084.5" cy="-882" rx="217.96" ry="18"/>
<text text-anchor="middle" x="1084.5" y="-878.3" font-family="Times,serif" font-size="14.00">attention_mask: Tensor[(1, 1, 1, 14), float32]</text>
</g>
<!-- 39 -->
<g id="node31" class="node">
<title>39</title>
<polygon fill="none" stroke="black" points="1120,-828 1049,-828 1049,-792 1120,-792 1120,-828"/>
<text text-anchor="middle" x="1084.5" y="-806.3" font-family="Times,serif" font-size="14.00">add(·, ·)</text>
</g>
<!-- 1&#45;&gt;39 -->
<g id="edge31" class="edge">
<title>1&#45;&gt;39</title>
<path fill="none" stroke="black" d="M1084.5,-863.7C1084.5,-855.98 1084.5,-846.71 1084.5,-838.11"/>
<polygon fill="black" stroke="black" points="1088,-838.1 1084.5,-828.1 1081,-838.1 1088,-838.1"/>
</g>
<!-- 15 -->
<g id="node8" class="node">
<title>15</title>
<polygon fill="none" stroke="black" points="834,-1620 665,-1620 665,-1584 834,-1584 834,-1620"/>
<text text-anchor="middle" x="749.5" y="-1598.3" font-family="Times,serif" font-size="14.00">nn.batch_matmul(·, ·)</text>
</g>
<!-- 10&#45;&gt;15 -->
<g id="edge5" class="edge">
<title>10&#45;&gt;15</title>
<path fill="none" stroke="black" d="M873.38,-1655.88C850.86,-1646.26 822.58,-1634.19 798.73,-1624.01"/>
<polygon fill="black" stroke="black" points="800.06,-1620.77 789.49,-1620.07 797.31,-1627.21 800.06,-1620.77"/>
</g>
<!-- 26 -->
<g id="node19" class="node">
<title>26</title>
<polygon fill="none" stroke="black" points="275,-1620 106,-1620 106,-1584 275,-1584 275,-1620"/>
<text text-anchor="middle" x="190.5" y="-1598.3" font-family="Times,serif" font-size="14.00">nn.batch_matmul(·, ·)</text>
</g>
<!-- 10&#45;&gt;26 -->
<g id="edge16" class="edge">
<title>10&#45;&gt;26</title>
<path fill="none" stroke="black" d="M737.56,-1655.97C595.14,-1642.18 400.01,-1623.28 285.39,-1612.19"/>
<polygon fill="black" stroke="black" points="285.53,-1608.68 275.24,-1611.2 284.86,-1615.65 285.53,-1608.68"/>
</g>
<!-- 48 -->
<g id="node40" class="node">
<title>48</title>
<polygon fill="none" stroke="black" points="1405,-1620 1236,-1620 1236,-1584 1405,-1584 1405,-1620"/>
<text text-anchor="middle" x="1320.5" y="-1598.3" font-family="Times,serif" font-size="14.00">nn.batch_matmul(·, ·)</text>
</g>
<!-- 10&#45;&gt;48 -->
<g id="edge39" class="edge">
<title>10&#45;&gt;48</title>
<path fill="none" stroke="black" d="M1012.54,-1655.97C1077.43,-1644.81 1161.75,-1630.3 1225.75,-1619.3"/>
<polygon fill="black" stroke="black" points="1226.58,-1622.71 1235.84,-1617.56 1225.39,-1615.81 1226.58,-1622.71"/>
</g>
<!-- 11 -->
<g id="node4" class="node">
<title>11</title>
<polygon fill="none" stroke="black" points="690.5,-1908 466.5,-1908 466.5,-1872 690.5,-1872 690.5,-1908"/>
<text text-anchor="middle" x="578.5" y="-1886.3" font-family="Times,serif" font-size="14.00">Constant((768, 768), float32)</text>
</g>
<!-- 12 -->
<g id="node5" class="node">
<title>12</title>
<polygon fill="none" stroke="black" points="675,-1836 482,-1836 482,-1800 675,-1800 675,-1836"/>
<text text-anchor="middle" x="578.5" y="-1814.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[1, 0])</text>
</g>
<!-- 11&#45;&gt;12 -->
<g id="edge2" class="edge">
<title>11&#45;&gt;12</title>
<path fill="none" stroke="black" d="M578.5,-1871.7C578.5,-1863.98 578.5,-1854.71 578.5,-1846.11"/>
<polygon fill="black" stroke="black" points="582,-1846.1 578.5,-1836.1 575,-1846.1 582,-1846.1"/>
</g>
<!-- 13 -->
<g id="node6" class="node">
<title>13</title>
<polygon fill="none" stroke="black" points="759,-1764 398,-1764 398,-1728 759,-1728 759,-1764"/>
<text text-anchor="middle" x="578.5" y="-1742.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 768, 768], reverse=0)</text>
</g>
<!-- 12&#45;&gt;13 -->
<g id="edge3" class="edge">
<title>12&#45;&gt;13</title>
<path fill="none" stroke="black" d="M578.5,-1799.7C578.5,-1791.98 578.5,-1782.71 578.5,-1774.11"/>
<polygon fill="black" stroke="black" points="582,-1774.1 578.5,-1764.1 575,-1774.1 582,-1774.1"/>
</g>
<!-- 14 -->
<g id="node7" class="node">
<title>14</title>
<polygon fill="none" stroke="black" points="701,-1692 490,-1692 490,-1656 701,-1656 701,-1692"/>
<text text-anchor="middle" x="595.5" y="-1670.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1])</text>
</g>
<!-- 13&#45;&gt;14 -->
<g id="edge4" class="edge">
<title>13&#45;&gt;14</title>
<path fill="none" stroke="black" d="M582.7,-1727.7C584.6,-1719.9 586.88,-1710.51 588.98,-1701.83"/>
<polygon fill="black" stroke="black" points="592.39,-1702.65 591.35,-1692.1 585.58,-1701 592.39,-1702.65"/>
</g>
<!-- 14&#45;&gt;15 -->
<g id="edge6" class="edge">
<title>14&#45;&gt;15</title>
<path fill="none" stroke="black" d="M633.17,-1655.88C654.13,-1646.35 680.4,-1634.41 702.68,-1624.28"/>
<polygon fill="black" stroke="black" points="704.29,-1627.39 711.95,-1620.07 701.4,-1621.02 704.29,-1627.39"/>
</g>
<!-- 16 -->
<g id="node9" class="node">
<title>16</title>
<polygon fill="none" stroke="black" points="923,-1548 576,-1548 576,-1512 923,-1512 923,-1548"/>
<text text-anchor="middle" x="749.5" y="-1526.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 768], reverse=0)</text>
</g>
<!-- 15&#45;&gt;16 -->
<g id="edge7" class="edge">
<title>15&#45;&gt;16</title>
<path fill="none" stroke="black" d="M749.5,-1583.7C749.5,-1575.98 749.5,-1566.71 749.5,-1558.11"/>
<polygon fill="black" stroke="black" points="753,-1558.1 749.5,-1548.1 746,-1558.1 753,-1558.1"/>
</g>
<!-- 18 -->
<g id="node11" class="node">
<title>18</title>
<polygon fill="none" stroke="black" points="869,-1476 798,-1476 798,-1440 869,-1440 869,-1476"/>
<text text-anchor="middle" x="833.5" y="-1454.3" font-family="Times,serif" font-size="14.00">add(·, ·)</text>
</g>
<!-- 16&#45;&gt;18 -->
<g id="edge8" class="edge">
<title>16&#45;&gt;18</title>
<path fill="none" stroke="black" d="M770.26,-1511.7C780.74,-1502.97 793.61,-1492.24 805,-1482.75"/>
<polygon fill="black" stroke="black" points="807.53,-1485.19 812.97,-1476.1 803.05,-1479.82 807.53,-1485.19"/>
</g>
<!-- 17 -->
<g id="node10" class="node">
<title>17</title>
<polygon fill="none" stroke="black" points="1133.5,-1548 941.5,-1548 941.5,-1512 1133.5,-1512 1133.5,-1548"/>
<text text-anchor="middle" x="1037.5" y="-1526.3" font-family="Times,serif" font-size="14.00">Constant((768,), float32)</text>
</g>
<!-- 17&#45;&gt;18 -->
<g id="edge9" class="edge">
<title>17&#45;&gt;18</title>
<path fill="none" stroke="black" d="M987.86,-1511.97C954.62,-1500.56 911.2,-1485.66 878.88,-1474.57"/>
<polygon fill="black" stroke="black" points="879.83,-1471.2 869.23,-1471.26 877.55,-1477.82 879.83,-1471.2"/>
</g>
<!-- 19 -->
<g id="node12" class="node">
<title>19</title>
<polygon fill="none" stroke="black" points="1016,-1404 651,-1404 651,-1368 1016,-1368 1016,-1404"/>
<text text-anchor="middle" x="833.5" y="-1382.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 12, 64], reverse=0)</text>
</g>
<!-- 18&#45;&gt;19 -->
<g id="edge10" class="edge">
<title>18&#45;&gt;19</title>
<path fill="none" stroke="black" d="M833.5,-1439.7C833.5,-1431.98 833.5,-1422.71 833.5,-1414.11"/>
<polygon fill="black" stroke="black" points="837,-1414.1 833.5,-1404.1 830,-1414.1 837,-1414.1"/>
</g>
<!-- 20 -->
<g id="node13" class="node">
<title>20</title>
<polygon fill="none" stroke="black" points="921,-1332 692,-1332 692,-1296 921,-1296 921,-1332"/>
<text text-anchor="middle" x="806.5" y="-1310.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1, 3])</text>
</g>
<!-- 19&#45;&gt;20 -->
<g id="edge11" class="edge">
<title>19&#45;&gt;20</title>
<path fill="none" stroke="black" d="M826.83,-1367.7C823.79,-1359.81 820.12,-1350.3 816.74,-1341.55"/>
<polygon fill="black" stroke="black" points="819.96,-1340.17 813.1,-1332.1 813.43,-1342.69 819.96,-1340.17"/>
</g>
<!-- 21 -->
<g id="node14" class="node">
<title>21</title>
<polygon fill="none" stroke="black" points="973,-1116 630,-1116 630,-1080 973,-1080 973,-1116"/>
<text text-anchor="middle" x="801.5" y="-1094.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 14, 64], reverse=0)</text>
</g>
<!-- 20&#45;&gt;21 -->
<g id="edge12" class="edge">
<title>20&#45;&gt;21</title>
<path fill="none" stroke="black" d="M806.1,-1295.85C805.23,-1258.83 803.19,-1171.18 802.14,-1126.39"/>
<polygon fill="black" stroke="black" points="805.64,-1126.15 801.9,-1116.23 798.64,-1126.31 805.64,-1126.15"/>
</g>
<!-- 35 -->
<g id="node28" class="node">
<title>35</title>
<polygon fill="none" stroke="black" points="880,-1044 711,-1044 711,-1008 880,-1008 880,-1044"/>
<text text-anchor="middle" x="795.5" y="-1022.3" font-family="Times,serif" font-size="14.00">nn.batch_matmul(·, ·)</text>
</g>
<!-- 21&#45;&gt;35 -->
<g id="edge26" class="edge">
<title>21&#45;&gt;35</title>
<path fill="none" stroke="black" d="M800.02,-1079.7C799.36,-1071.98 798.56,-1062.71 797.82,-1054.11"/>
<polygon fill="black" stroke="black" points="801.31,-1053.77 796.97,-1044.1 794.33,-1054.37 801.31,-1053.77"/>
</g>
<!-- 22 -->
<g id="node15" class="node">
<title>22</title>
<polygon fill="none" stroke="black" points="302.5,-1908 78.5,-1908 78.5,-1872 302.5,-1872 302.5,-1908"/>
<text text-anchor="middle" x="190.5" y="-1886.3" font-family="Times,serif" font-size="14.00">Constant((768, 768), float32)</text>
</g>
<!-- 23 -->
<g id="node16" class="node">
<title>23</title>
<polygon fill="none" stroke="black" points="287,-1836 94,-1836 94,-1800 287,-1800 287,-1836"/>
<text text-anchor="middle" x="190.5" y="-1814.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[1, 0])</text>
</g>
<!-- 22&#45;&gt;23 -->
<g id="edge13" class="edge">
<title>22&#45;&gt;23</title>
<path fill="none" stroke="black" d="M190.5,-1871.7C190.5,-1863.98 190.5,-1854.71 190.5,-1846.11"/>
<polygon fill="black" stroke="black" points="194,-1846.1 190.5,-1836.1 187,-1846.1 194,-1846.1"/>
</g>
<!-- 24 -->
<g id="node17" class="node">
<title>24</title>
<polygon fill="none" stroke="black" points="371,-1764 10,-1764 10,-1728 371,-1728 371,-1764"/>
<text text-anchor="middle" x="190.5" y="-1742.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 768, 768], reverse=0)</text>
</g>
<!-- 23&#45;&gt;24 -->
<g id="edge14" class="edge">
<title>23&#45;&gt;24</title>
<path fill="none" stroke="black" d="M190.5,-1799.7C190.5,-1791.98 190.5,-1782.71 190.5,-1774.11"/>
<polygon fill="black" stroke="black" points="194,-1774.1 190.5,-1764.1 187,-1774.1 194,-1774.1"/>
</g>
<!-- 25 -->
<g id="node18" class="node">
<title>25</title>
<polygon fill="none" stroke="black" points="296,-1692 85,-1692 85,-1656 296,-1656 296,-1692"/>
<text text-anchor="middle" x="190.5" y="-1670.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1])</text>
</g>
<!-- 24&#45;&gt;25 -->
<g id="edge15" class="edge">
<title>24&#45;&gt;25</title>
<path fill="none" stroke="black" d="M190.5,-1727.7C190.5,-1719.98 190.5,-1710.71 190.5,-1702.11"/>
<polygon fill="black" stroke="black" points="194,-1702.1 190.5,-1692.1 187,-1702.1 194,-1702.1"/>
</g>
<!-- 25&#45;&gt;26 -->
<g id="edge17" class="edge">
<title>25&#45;&gt;26</title>
<path fill="none" stroke="black" d="M190.5,-1655.7C190.5,-1647.98 190.5,-1638.71 190.5,-1630.11"/>
<polygon fill="black" stroke="black" points="194,-1630.1 190.5,-1620.1 187,-1630.1 194,-1630.1"/>
</g>
<!-- 27 -->
<g id="node20" class="node">
<title>27</title>
<polygon fill="none" stroke="black" points="347,-1548 0,-1548 0,-1512 347,-1512 347,-1548"/>
<text text-anchor="middle" x="173.5" y="-1526.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 768], reverse=0)</text>
</g>
<!-- 26&#45;&gt;27 -->
<g id="edge18" class="edge">
<title>26&#45;&gt;27</title>
<path fill="none" stroke="black" d="M186.3,-1583.7C184.4,-1575.9 182.12,-1566.51 180.02,-1557.83"/>
<polygon fill="black" stroke="black" points="183.42,-1557 177.65,-1548.1 176.61,-1558.65 183.42,-1557"/>
</g>
<!-- 29 -->
<g id="node22" class="node">
<title>29</title>
<polygon fill="none" stroke="black" points="486,-1476 415,-1476 415,-1440 486,-1440 486,-1476"/>
<text text-anchor="middle" x="450.5" y="-1454.3" font-family="Times,serif" font-size="14.00">add(·, ·)</text>
</g>
<!-- 27&#45;&gt;29 -->
<g id="edge19" class="edge">
<title>27&#45;&gt;29</title>
<path fill="none" stroke="black" d="M240.91,-1511.97C291.72,-1499.13 360.04,-1481.86 404.66,-1470.58"/>
<polygon fill="black" stroke="black" points="405.8,-1473.91 414.64,-1468.06 404.09,-1467.12 405.8,-1473.91"/>
</g>
<!-- 28 -->
<g id="node21" class="node">
<title>28</title>
<polygon fill="none" stroke="black" points="557.5,-1548 365.5,-1548 365.5,-1512 557.5,-1512 557.5,-1548"/>
<text text-anchor="middle" x="461.5" y="-1526.3" font-family="Times,serif" font-size="14.00">Constant((768,), float32)</text>
</g>
<!-- 28&#45;&gt;29 -->
<g id="edge20" class="edge">
<title>28&#45;&gt;29</title>
<path fill="none" stroke="black" d="M458.78,-1511.7C457.57,-1503.98 456.11,-1494.71 454.76,-1486.11"/>
<polygon fill="black" stroke="black" points="458.2,-1485.44 453.19,-1476.1 451.28,-1486.53 458.2,-1485.44"/>
</g>
<!-- 30 -->
<g id="node23" class="node">
<title>30</title>
<polygon fill="none" stroke="black" points="633,-1404 268,-1404 268,-1368 633,-1368 633,-1404"/>
<text text-anchor="middle" x="450.5" y="-1382.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 12, 64], reverse=0)</text>
</g>
<!-- 29&#45;&gt;30 -->
<g id="edge21" class="edge">
<title>29&#45;&gt;30</title>
<path fill="none" stroke="black" d="M450.5,-1439.7C450.5,-1431.98 450.5,-1422.71 450.5,-1414.11"/>
<polygon fill="black" stroke="black" points="454,-1414.1 450.5,-1404.1 447,-1414.1 454,-1414.1"/>
</g>
<!-- 31 -->
<g id="node24" class="node">
<title>31</title>
<polygon fill="none" stroke="black" points="566,-1332 337,-1332 337,-1296 566,-1296 566,-1332"/>
<text text-anchor="middle" x="451.5" y="-1310.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1, 3])</text>
</g>
<!-- 30&#45;&gt;31 -->
<g id="edge22" class="edge">
<title>30&#45;&gt;31</title>
<path fill="none" stroke="black" d="M450.75,-1367.7C450.86,-1359.98 450.99,-1350.71 451.11,-1342.11"/>
<polygon fill="black" stroke="black" points="454.61,-1342.15 451.26,-1332.1 447.61,-1342.05 454.61,-1342.15"/>
</g>
<!-- 32 -->
<g id="node25" class="node">
<title>32</title>
<polygon fill="none" stroke="black" points="596,-1260 367,-1260 367,-1224 596,-1224 596,-1260"/>
<text text-anchor="middle" x="481.5" y="-1238.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 1, 3, 2])</text>
</g>
<!-- 31&#45;&gt;32 -->
<g id="edge23" class="edge">
<title>31&#45;&gt;32</title>
<path fill="none" stroke="black" d="M458.92,-1295.7C462.29,-1287.81 466.37,-1278.3 470.12,-1269.55"/>
<polygon fill="black" stroke="black" points="473.45,-1270.67 474.17,-1260.1 467.01,-1267.92 473.45,-1270.67"/>
</g>
<!-- 33 -->
<g id="node26" class="node">
<title>33</title>
<polygon fill="none" stroke="black" points="668,-1188 325,-1188 325,-1152 668,-1152 668,-1188"/>
<text text-anchor="middle" x="496.5" y="-1166.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 64, 14], reverse=0)</text>
</g>
<!-- 32&#45;&gt;33 -->
<g id="edge24" class="edge">
<title>32&#45;&gt;33</title>
<path fill="none" stroke="black" d="M485.21,-1223.7C486.86,-1215.98 488.85,-1206.71 490.69,-1198.11"/>
<polygon fill="black" stroke="black" points="494.16,-1198.62 492.83,-1188.1 487.32,-1197.15 494.16,-1198.62"/>
</g>
<!-- 34 -->
<g id="node27" class="node">
<title>34</title>
<polygon fill="none" stroke="black" points="610,-1116 399,-1116 399,-1080 610,-1080 610,-1116"/>
<text text-anchor="middle" x="504.5" y="-1094.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1])</text>
</g>
<!-- 33&#45;&gt;34 -->
<g id="edge25" class="edge">
<title>33&#45;&gt;34</title>
<path fill="none" stroke="black" d="M498.48,-1151.7C499.36,-1143.98 500.42,-1134.71 501.4,-1126.11"/>
<polygon fill="black" stroke="black" points="504.89,-1126.44 502.55,-1116.1 497.93,-1125.64 504.89,-1126.44"/>
</g>
<!-- 34&#45;&gt;35 -->
<g id="edge27" class="edge">
<title>34&#45;&gt;35</title>
<path fill="none" stroke="black" d="M575.31,-1079.97C617.47,-1069.83 671.09,-1056.93 714.87,-1046.4"/>
<polygon fill="black" stroke="black" points="715.72,-1049.79 724.62,-1044.05 714.08,-1042.99 715.72,-1049.79"/>
</g>
<!-- 36 -->
<g id="node29" class="node">
<title>36</title>
<polygon fill="none" stroke="black" points="978,-972 613,-972 613,-936 978,-936 978,-972"/>
<text text-anchor="middle" x="795.5" y="-950.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 12, 14, 14], reverse=0)</text>
</g>
<!-- 35&#45;&gt;36 -->
<g id="edge28" class="edge">
<title>35&#45;&gt;36</title>
<path fill="none" stroke="black" d="M795.5,-1007.7C795.5,-999.98 795.5,-990.71 795.5,-982.11"/>
<polygon fill="black" stroke="black" points="799,-982.1 795.5,-972.1 792,-982.1 799,-982.1"/>
</g>
<!-- 38 -->
<g id="node30" class="node">
<title>38</title>
<polygon fill="none" stroke="black" points="849,-900 742,-900 742,-864 849,-864 849,-900"/>
<text text-anchor="middle" x="795.5" y="-878.3" font-family="Times,serif" font-size="14.00">divide(·, 8.0)</text>
</g>
<!-- 36&#45;&gt;38 -->
<g id="edge29" class="edge">
<title>36&#45;&gt;38</title>
<path fill="none" stroke="black" d="M795.5,-935.7C795.5,-927.98 795.5,-918.71 795.5,-910.11"/>
<polygon fill="black" stroke="black" points="799,-910.1 795.5,-900.1 792,-910.1 799,-910.1"/>
</g>
<!-- 38&#45;&gt;39 -->
<g id="edge30" class="edge">
<title>38&#45;&gt;39</title>
<path fill="none" stroke="black" d="M849.24,-866.13C852.03,-865.4 854.8,-864.69 857.5,-864 920.04,-848.13 992.73,-831.47 1038.67,-821.16"/>
<polygon fill="black" stroke="black" points="1039.63,-824.53 1048.62,-818.93 1038.1,-817.7 1039.63,-824.53"/>
</g>
<!-- 40 -->
<g id="node32" class="node">
<title>40</title>
<polygon fill="none" stroke="black" points="1194.5,-756 1020.5,-756 1020.5,-720 1194.5,-720 1194.5,-756"/>
<text text-anchor="middle" x="1107.5" y="-734.3" font-family="Times,serif" font-size="14.00">nn.softmax(·| axis=&#45;1)</text>
</g>
<!-- 39&#45;&gt;40 -->
<g id="edge32" class="edge">
<title>39&#45;&gt;40</title>
<path fill="none" stroke="black" d="M1090.19,-791.7C1092.75,-783.9 1095.83,-774.51 1098.68,-765.83"/>
<polygon fill="black" stroke="black" points="1102.08,-766.7 1101.88,-756.1 1095.43,-764.51 1102.08,-766.7"/>
</g>
<!-- 41 -->
<g id="node33" class="node">
<title>41</title>
<polygon fill="none" stroke="black" points="1211,-684 1028,-684 1028,-648 1211,-648 1211,-684"/>
<text text-anchor="middle" x="1119.5" y="-662.3" font-family="Times,serif" font-size="14.00">nn.dropout(·| rate=0.1)</text>
</g>
<!-- 40&#45;&gt;41 -->
<g id="edge33" class="edge">
<title>40&#45;&gt;41</title>
<path fill="none" stroke="black" d="M1110.47,-719.7C1111.79,-711.98 1113.38,-702.71 1114.85,-694.11"/>
<polygon fill="black" stroke="black" points="1118.33,-694.55 1116.57,-684.1 1111.43,-693.37 1118.33,-694.55"/>
</g>
<!-- 42 -->
<g id="node34" class="node">
<title>42</title>
<polygon fill="none" stroke="black" points="1209.5,-612 1041.5,-612 1041.5,-576 1209.5,-576 1209.5,-612"/>
<text text-anchor="middle" x="1125.5" y="-590.3" font-family="Times,serif" font-size="14.00">TupleGetItem(idx=0)</text>
</g>
<!-- 41&#45;&gt;42 -->
<g id="edge34" class="edge">
<title>41&#45;&gt;42</title>
<path fill="none" stroke="black" d="M1120.98,-647.7C1121.64,-639.98 1122.44,-630.71 1123.18,-622.11"/>
<polygon fill="black" stroke="black" points="1126.67,-622.37 1124.03,-612.1 1119.69,-621.77 1126.67,-622.37"/>
</g>
<!-- 43 -->
<g id="node35" class="node">
<title>43</title>
<polygon fill="none" stroke="black" points="1300,-540 957,-540 957,-504 1300,-504 1300,-540"/>
<text text-anchor="middle" x="1128.5" y="-518.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 14, 14], reverse=0)</text>
</g>
<!-- 42&#45;&gt;43 -->
<g id="edge35" class="edge">
<title>42&#45;&gt;43</title>
<path fill="none" stroke="black" d="M1126.24,-575.7C1126.57,-567.98 1126.97,-558.71 1127.34,-550.11"/>
<polygon fill="black" stroke="black" points="1130.84,-550.25 1127.77,-540.1 1123.84,-549.95 1130.84,-550.25"/>
</g>
<!-- 56 -->
<g id="node48" class="node">
<title>56</title>
<polygon fill="none" stroke="black" points="1312,-468 1143,-468 1143,-432 1312,-432 1312,-468"/>
<text text-anchor="middle" x="1227.5" y="-446.3" font-family="Times,serif" font-size="14.00">nn.batch_matmul(·, ·)</text>
</g>
<!-- 43&#45;&gt;56 -->
<g id="edge48" class="edge">
<title>43&#45;&gt;56</title>
<path fill="none" stroke="black" d="M1152.72,-503.88C1165.42,-494.89 1181.16,-483.76 1194.92,-474.03"/>
<polygon fill="black" stroke="black" points="1197.04,-476.82 1203.19,-468.19 1193,-471.11 1197.04,-476.82"/>
</g>
<!-- 44 -->
<g id="node36" class="node">
<title>44</title>
<polygon fill="none" stroke="black" points="1432.5,-1908 1208.5,-1908 1208.5,-1872 1432.5,-1872 1432.5,-1908"/>
<text text-anchor="middle" x="1320.5" y="-1886.3" font-family="Times,serif" font-size="14.00">Constant((768, 768), float32)</text>
</g>
<!-- 45 -->
<g id="node37" class="node">
<title>45</title>
<polygon fill="none" stroke="black" points="1417,-1836 1224,-1836 1224,-1800 1417,-1800 1417,-1836"/>
<text text-anchor="middle" x="1320.5" y="-1814.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[1, 0])</text>
</g>
<!-- 44&#45;&gt;45 -->
<g id="edge36" class="edge">
<title>44&#45;&gt;45</title>
<path fill="none" stroke="black" d="M1320.5,-1871.7C1320.5,-1863.98 1320.5,-1854.71 1320.5,-1846.11"/>
<polygon fill="black" stroke="black" points="1324,-1846.1 1320.5,-1836.1 1317,-1846.1 1324,-1846.1"/>
</g>
<!-- 46 -->
<g id="node38" class="node">
<title>46</title>
<polygon fill="none" stroke="black" points="1501,-1764 1140,-1764 1140,-1728 1501,-1728 1501,-1764"/>
<text text-anchor="middle" x="1320.5" y="-1742.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 768, 768], reverse=0)</text>
</g>
<!-- 45&#45;&gt;46 -->
<g id="edge37" class="edge">
<title>45&#45;&gt;46</title>
<path fill="none" stroke="black" d="M1320.5,-1799.7C1320.5,-1791.98 1320.5,-1782.71 1320.5,-1774.11"/>
<polygon fill="black" stroke="black" points="1324,-1774.1 1320.5,-1764.1 1317,-1774.1 1324,-1774.1"/>
</g>
<!-- 47 -->
<g id="node39" class="node">
<title>47</title>
<polygon fill="none" stroke="black" points="1426,-1692 1215,-1692 1215,-1656 1426,-1656 1426,-1692"/>
<text text-anchor="middle" x="1320.5" y="-1670.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1])</text>
</g>
<!-- 46&#45;&gt;47 -->
<g id="edge38" class="edge">
<title>46&#45;&gt;47</title>
<path fill="none" stroke="black" d="M1320.5,-1727.7C1320.5,-1719.98 1320.5,-1710.71 1320.5,-1702.11"/>
<polygon fill="black" stroke="black" points="1324,-1702.1 1320.5,-1692.1 1317,-1702.1 1324,-1702.1"/>
</g>
<!-- 47&#45;&gt;48 -->
<g id="edge40" class="edge">
<title>47&#45;&gt;48</title>
<path fill="none" stroke="black" d="M1320.5,-1655.7C1320.5,-1647.98 1320.5,-1638.71 1320.5,-1630.11"/>
<polygon fill="black" stroke="black" points="1324,-1630.1 1320.5,-1620.1 1317,-1630.1 1324,-1630.1"/>
</g>
<!-- 49 -->
<g id="node41" class="node">
<title>49</title>
<polygon fill="none" stroke="black" points="1499,-1548 1152,-1548 1152,-1512 1499,-1512 1499,-1548"/>
<text text-anchor="middle" x="1325.5" y="-1526.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 768], reverse=0)</text>
</g>
<!-- 48&#45;&gt;49 -->
<g id="edge41" class="edge">
<title>48&#45;&gt;49</title>
<path fill="none" stroke="black" d="M1321.74,-1583.7C1322.29,-1575.98 1322.95,-1566.71 1323.56,-1558.11"/>
<polygon fill="black" stroke="black" points="1327.06,-1558.33 1324.28,-1548.1 1320.07,-1557.83 1327.06,-1558.33"/>
</g>
<!-- 51 -->
<g id="node43" class="node">
<title>51</title>
<polygon fill="none" stroke="black" points="1366,-1476 1295,-1476 1295,-1440 1366,-1440 1366,-1476"/>
<text text-anchor="middle" x="1330.5" y="-1454.3" font-family="Times,serif" font-size="14.00">add(·, ·)</text>
</g>
<!-- 49&#45;&gt;51 -->
<g id="edge42" class="edge">
<title>49&#45;&gt;51</title>
<path fill="none" stroke="black" d="M1326.74,-1511.7C1327.29,-1503.98 1327.95,-1494.71 1328.56,-1486.11"/>
<polygon fill="black" stroke="black" points="1332.06,-1486.33 1329.28,-1476.1 1325.07,-1485.83 1332.06,-1486.33"/>
</g>
<!-- 50 -->
<g id="node42" class="node">
<title>50</title>
<polygon fill="none" stroke="black" points="1709.5,-1548 1517.5,-1548 1517.5,-1512 1709.5,-1512 1709.5,-1548"/>
<text text-anchor="middle" x="1613.5" y="-1526.3" font-family="Times,serif" font-size="14.00">Constant((768,), float32)</text>
</g>
<!-- 50&#45;&gt;51 -->
<g id="edge43" class="edge">
<title>50&#45;&gt;51</title>
<path fill="none" stroke="black" d="M1544.63,-1511.97C1492.31,-1499.02 1421.8,-1481.58 1376.25,-1470.32"/>
<polygon fill="black" stroke="black" points="1376.9,-1466.87 1366.36,-1467.87 1375.22,-1473.67 1376.9,-1466.87"/>
</g>
<!-- 52 -->
<g id="node44" class="node">
<title>52</title>
<polygon fill="none" stroke="black" points="1513,-1404 1148,-1404 1148,-1368 1513,-1368 1513,-1404"/>
<text text-anchor="middle" x="1330.5" y="-1382.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 12, 64], reverse=0)</text>
</g>
<!-- 51&#45;&gt;52 -->
<g id="edge44" class="edge">
<title>51&#45;&gt;52</title>
<path fill="none" stroke="black" d="M1330.5,-1439.7C1330.5,-1431.98 1330.5,-1422.71 1330.5,-1414.11"/>
<polygon fill="black" stroke="black" points="1334,-1414.1 1330.5,-1404.1 1327,-1414.1 1334,-1414.1"/>
</g>
<!-- 53 -->
<g id="node45" class="node">
<title>53</title>
<polygon fill="none" stroke="black" points="1445,-1332 1216,-1332 1216,-1296 1445,-1296 1445,-1332"/>
<text text-anchor="middle" x="1330.5" y="-1310.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1, 3])</text>
</g>
<!-- 52&#45;&gt;53 -->
<g id="edge45" class="edge">
<title>52&#45;&gt;53</title>
<path fill="none" stroke="black" d="M1330.5,-1367.7C1330.5,-1359.98 1330.5,-1350.71 1330.5,-1342.11"/>
<polygon fill="black" stroke="black" points="1334,-1342.1 1330.5,-1332.1 1327,-1342.1 1334,-1342.1"/>
</g>
<!-- 54 -->
<g id="node46" class="node">
<title>54</title>
<polygon fill="none" stroke="black" points="1502,-1260 1159,-1260 1159,-1224 1502,-1224 1502,-1260"/>
<text text-anchor="middle" x="1330.5" y="-1238.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[&#45;1, 14, 64], reverse=0)</text>
</g>
<!-- 53&#45;&gt;54 -->
<g id="edge46" class="edge">
<title>53&#45;&gt;54</title>
<path fill="none" stroke="black" d="M1330.5,-1295.7C1330.5,-1287.98 1330.5,-1278.71 1330.5,-1270.11"/>
<polygon fill="black" stroke="black" points="1334,-1270.1 1330.5,-1260.1 1327,-1270.1 1334,-1270.1"/>
</g>
<!-- 55 -->
<g id="node47" class="node">
<title>55</title>
<polygon fill="none" stroke="black" points="1436,-1044 1225,-1044 1225,-1008 1436,-1008 1436,-1044"/>
<text text-anchor="middle" x="1330.5" y="-1022.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1])</text>
</g>
<!-- 54&#45;&gt;55 -->
<g id="edge47" class="edge">
<title>54&#45;&gt;55</title>
<path fill="none" stroke="black" d="M1330.5,-1223.85C1330.5,-1186.83 1330.5,-1099.18 1330.5,-1054.39"/>
<polygon fill="black" stroke="black" points="1334,-1054.23 1330.5,-1044.23 1327,-1054.23 1334,-1054.23"/>
</g>
<!-- 55&#45;&gt;56 -->
<g id="edge49" class="edge">
<title>55&#45;&gt;56</title>
<path fill="none" stroke="black" d="M1330.5,-1007.95C1330.5,-981.29 1330.5,-928.11 1330.5,-883 1330.5,-883 1330.5,-883 1330.5,-593 1330.5,-552.36 1332.93,-537.21 1309.5,-504 1300.77,-491.62 1288.14,-481.42 1275.4,-473.4"/>
<polygon fill="black" stroke="black" points="1276.99,-470.27 1266.6,-468.19 1273.42,-476.3 1276.99,-470.27"/>
</g>
<!-- 57 -->
<g id="node49" class="node">
<title>57</title>
<polygon fill="none" stroke="black" points="1410,-396 1045,-396 1045,-360 1410,-360 1410,-396"/>
<text text-anchor="middle" x="1227.5" y="-374.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 12, 14, 64], reverse=0)</text>
</g>
<!-- 56&#45;&gt;57 -->
<g id="edge50" class="edge">
<title>56&#45;&gt;57</title>
<path fill="none" stroke="black" d="M1227.5,-431.7C1227.5,-423.98 1227.5,-414.71 1227.5,-406.11"/>
<polygon fill="black" stroke="black" points="1231,-406.1 1227.5,-396.1 1224,-406.1 1231,-406.1"/>
</g>
<!-- 58 -->
<g id="node50" class="node">
<title>58</title>
<polygon fill="none" stroke="black" points="1342,-324 1113,-324 1113,-288 1342,-288 1342,-324"/>
<text text-anchor="middle" x="1227.5" y="-302.3" font-family="Times,serif" font-size="14.00">transpose(·| axes=[0, 2, 1, 3])</text>
</g>
<!-- 57&#45;&gt;58 -->
<g id="edge51" class="edge">
<title>57&#45;&gt;58</title>
<path fill="none" stroke="black" d="M1227.5,-359.7C1227.5,-351.98 1227.5,-342.71 1227.5,-334.11"/>
<polygon fill="black" stroke="black" points="1231,-334.1 1227.5,-324.1 1224,-334.1 1231,-334.1"/>
</g>
<!-- 59 -->
<g id="node51" class="node">
<title>59</title>
<polygon fill="none" stroke="black" points="1260,-252 1195,-252 1195,-216 1260,-216 1260,-252"/>
<text text-anchor="middle" x="1227.5" y="-230.3" font-family="Times,serif" font-size="14.00">copy(·)</text>
</g>
<!-- 58&#45;&gt;59 -->
<g id="edge52" class="edge">
<title>58&#45;&gt;59</title>
<path fill="none" stroke="black" d="M1227.5,-287.7C1227.5,-279.98 1227.5,-270.71 1227.5,-262.11"/>
<polygon fill="black" stroke="black" points="1231,-262.1 1227.5,-252.1 1224,-262.1 1231,-262.1"/>
</g>
<!-- 60 -->
<g id="node52" class="node">
<title>60</title>
<polygon fill="none" stroke="black" points="1401,-180 1054,-180 1054,-144 1401,-144 1401,-180"/>
<text text-anchor="middle" x="1227.5" y="-158.3" font-family="Times,serif" font-size="14.00">reshape(·| newshape=[1, 14, 768], reverse=0)</text>
</g>
<!-- 59&#45;&gt;60 -->
<g id="edge53" class="edge">
<title>59&#45;&gt;60</title>
<path fill="none" stroke="black" d="M1227.5,-215.7C1227.5,-207.98 1227.5,-198.71 1227.5,-190.11"/>
<polygon fill="black" stroke="black" points="1231,-190.1 1227.5,-180.1 1224,-190.1 1231,-190.1"/>
</g>
<!-- 61 -->
<g id="node53" class="node">
<title>61</title>
<polygon fill="none" stroke="black" points="1270.5,-108 1184.5,-108 1184.5,-72 1270.5,-72 1270.5,-108"/>
<text text-anchor="middle" x="1227.5" y="-86.3" font-family="Times,serif" font-size="14.00">Tuple[...]</text>
</g>
<!-- 60&#45;&gt;61 -->
<g id="edge54" class="edge">
<title>60&#45;&gt;61</title>
<path fill="none" stroke="black" d="M1227.5,-143.7C1227.5,-135.98 1227.5,-126.71 1227.5,-118.11"/>
<polygon fill="black" stroke="black" points="1231,-118.1 1227.5,-108.1 1224,-118.1 1231,-118.1"/>
</g>
<!-- 62 -->
<g id="node54" class="node">
<title>62</title>
<polygon fill="none" stroke="black" points="1267.5,-36 1187.5,-36 1187.5,0 1267.5,0 1267.5,-36"/>
<text text-anchor="middle" x="1227.5" y="-14.3" font-family="Times,serif" font-size="14.00">Function</text>
</g>
<!-- 61&#45;&gt;62 -->
<g id="edge55" class="edge">
<title>61&#45;&gt;62</title>
<path fill="none" stroke="black" d="M1227.5,-71.7C1227.5,-63.98 1227.5,-54.71 1227.5,-46.11"/>
<polygon fill="black" stroke="black" points="1231,-46.1 1227.5,-36.1 1224,-46.1 1231,-46.1"/>
</g>
</g>
</svg>