Spaces:
Running
Running
<div>
  <div class="plotly-graph-div" id="9f507a17-fb27-4b9a-9224-34ffad9cd0d4" style="height:410px; width:1000px;"></div>
  <script>
    /*
     * Renders a three-panel stacked bar chart ("Memory Usage vs Sequence Length
     * for Different Model Sizes") into the sibling .plotly-graph-div element.
     *
     * Each panel (1B / 8B / 70B model) stacks four memory components --
     * parameters, gradients, optimizer states, activations -- for sequence
     * lengths 1024..16384, with a dashed red reference line at y = 80.
     *
     * Requires the global `Plotly` object to be loaded before this script runs.
     * All string literals are kept on a single line: a raw line break inside a
     * quoted JavaScript string is a syntax error and would stop the chart from
     * rendering at all.
     */
    (function () {
      var GRAPH_ID = "9f507a17-fb27-4b9a-9224-34ffad9cd0d4";

      window.PLOTLYENV = window.PLOTLYENV || {};

      // Nothing to draw into: bail out quietly, exactly like the original guard.
      if (!document.getElementById(GRAPH_ID)) {
        return;
      }

      // ---------------------------------------------------------------- data

      var SEQUENCE_LENGTHS = ["1024", "2048", "4096", "8192", "16384"];

      // Stacking order inside every bar (bottom to top) and the colour of each part.
      var COMPONENTS = [
        { name: "parameters", color: "#4ea5b7" },
        { name: "gradients", color: "#e889ab" },
        { name: "optimizer states", color: "#cec0fa" },
        { name: "activations", color: "#e38a42" }
      ];

      // One entry per subplot. `axis` is the Plotly axis suffix ("" -> x/y,
      // "2" -> x2/y2, ...). The first three components do not vary with sequence
      // length, so a single number is stored for them; activations vary per length.
      var MODELS = [
        {
          axis: "",
          showLegend: true, // only the first panel contributes legend entries
          values: {
            "parameters": 2.3017578125,
            "gradients": 2.3017578125,
            "optimizer states": 9.20703125,
            "activations": [1.0625, 2.125, 4.25, 8.5, 17]
          }
        },
        {
          axis: "2",
          showLegend: false,
          values: {
            "parameters": 14.95703125,
            "gradients": 14.95703125,
            "optimizer states": 59.828125,
            "activations": [4.25, 8.5, 17, 34, 68]
          }
        },
        {
          axis: "3",
          showLegend: false,
          values: {
            "parameters": 131.4140625,
            "gradients": 131.4140625,
            "optimizer states": 525.65625,
            "activations": [21.25, 42.5, 85, 170, 340]
          }
        }
      ];

      // Expands a scalar into one value per sequence length; arrays are copied as-is.
      function perSequenceLength(value) {
        if (Array.isArray(value)) {
          return value.slice();
        }
        return SEQUENCE_LENGTHS.map(function () {
          return value;
        });
      }

      // Builds one bar trace for a (model, component) pair.
      function barTrace(model, component) {
        return {
          legendgroup: component.name,
          marker: { color: component.color },
          name: component.name,
          showlegend: model.showLegend,
          x: SEQUENCE_LENGTHS.slice(),
          y: perSequenceLength(model.values[component.name]),
          type: "bar",
          xaxis: "x" + model.axis,
          yaxis: "y" + model.axis
        };
      }

      // Trace order: all four components of model 1, then model 2, then model 3.
      var traces = [];
      MODELS.forEach(function (model) {
        COMPONENTS.forEach(function (component) {
          traces.push(barTrace(model, component));
        });
      });

      // ------------------------------------------------------------ template
      // The helpers below return a fresh object on every call so that no two
      // places in the figure share (and could accidentally co-mutate) one object.

      // 10-stop sequential colorscale used by the template's heatmap-like traces.
      function sequentialScale() {
        return [
          [0, "#0d0887"],
          [0.1111111111111111, "#46039f"],
          [0.2222222222222222, "#7201a8"],
          [0.3333333333333333, "#9c179e"],
          [0.4444444444444444, "#bd3786"],
          [0.5555555555555556, "#d8576b"],
          [0.6666666666666666, "#ed7953"],
          [0.7777777777777778, "#fb9f3a"],
          [0.8888888888888888, "#fdca26"],
          [1, "#f0f921"]
        ];
      }

      function colorbar() {
        return { outlinewidth: 0, ticks: "" };
      }

      function fillPattern() {
        return { fillmode: "overlay", size: 10, solidity: 0.2 };
      }

      // Template entry: trace type with a plain colorbar.
      function withColorbar(type) {
        return [{ type: type, colorbar: colorbar() }];
      }

      // Template entry: trace type with a colorbar and the sequential colorscale.
      function withColorscale(type) {
        return [{ type: type, colorbar: colorbar(), colorscale: sequentialScale() }];
      }

      // Template entry: trace type whose marker carries the colorbar.
      function withMarkerColorbar(type) {
        return [{ type: type, marker: { colorbar: colorbar() } }];
      }

      // Template entry: bar-like trace type with outlined, patterned markers.
      function outlinedMarker() {
        return { line: { color: "#E5ECF6", width: 0.5 }, pattern: fillPattern() };
      }

      function carpetAxis() {
        return {
          endlinecolor: "#2a3f5f",
          gridcolor: "white",
          linecolor: "white",
          minorgridcolor: "white",
          startlinecolor: "#2a3f5f"
        };
      }

      // Axis styling shared by polar and ternary axes.
      function plainAxis() {
        return { gridcolor: "white", linecolor: "white", ticks: "" };
      }

      function cartesianAxis() {
        return {
          gridcolor: "white",
          linecolor: "white",
          ticks: "",
          title: { standoff: 15 },
          zerolinecolor: "white",
          automargin: true,
          zerolinewidth: 2
        };
      }

      function sceneAxis() {
        return {
          backgroundcolor: "#E5ECF6",
          gridcolor: "white",
          linecolor: "white",
          showbackground: true,
          ticks: "",
          zerolinecolor: "white",
          gridwidth: 2
        };
      }

      var template = {
        data: {
          histogram2dcontour: withColorscale("histogram2dcontour"),
          choropleth: withColorbar("choropleth"),
          histogram2d: withColorscale("histogram2d"),
          heatmap: withColorscale("heatmap"),
          heatmapgl: withColorscale("heatmapgl"),
          contourcarpet: withColorbar("contourcarpet"),
          contour: withColorscale("contour"),
          surface: withColorscale("surface"),
          mesh3d: withColorbar("mesh3d"),
          scatter: [{ fillpattern: fillPattern(), type: "scatter" }],
          parcoords: [{ type: "parcoords", line: { colorbar: colorbar() } }],
          scatterpolargl: withMarkerColorbar("scatterpolargl"),
          bar: [
            {
              error_x: { color: "#2a3f5f" },
              error_y: { color: "#2a3f5f" },
              marker: outlinedMarker(),
              type: "bar"
            }
          ],
          scattergeo: withMarkerColorbar("scattergeo"),
          scatterpolar: withMarkerColorbar("scatterpolar"),
          histogram: [{ marker: { pattern: fillPattern() }, type: "histogram" }],
          scattergl: withMarkerColorbar("scattergl"),
          scatter3d: [
            {
              type: "scatter3d",
              line: { colorbar: colorbar() },
              marker: { colorbar: colorbar() }
            }
          ],
          scattermapbox: withMarkerColorbar("scattermapbox"),
          scatterternary: withMarkerColorbar("scatterternary"),
          scattercarpet: withMarkerColorbar("scattercarpet"),
          carpet: [{ aaxis: carpetAxis(), baxis: carpetAxis(), type: "carpet" }],
          table: [
            {
              cells: { fill: { color: "#EBF0F8" }, line: { color: "white" } },
              header: { fill: { color: "#C8D4E3" }, line: { color: "white" } },
              type: "table"
            }
          ],
          barpolar: [{ marker: outlinedMarker(), type: "barpolar" }],
          pie: [{ automargin: true, type: "pie" }]
        },
        layout: {
          autotypenumbers: "strict",
          colorway: [
            "#636efa", "#EF553B", "#00cc96", "#ab63fa", "#FFA15A",
            "#19d3f3", "#FF6692", "#B6E880", "#FF97FF", "#FECB52"
          ],
          font: { color: "#2a3f5f" },
          hovermode: "closest",
          hoverlabel: { align: "left" },
          paper_bgcolor: "white",
          plot_bgcolor: "#E5ECF6",
          polar: {
            bgcolor: "#E5ECF6",
            angularaxis: plainAxis(),
            radialaxis: plainAxis()
          },
          ternary: {
            bgcolor: "#E5ECF6",
            aaxis: plainAxis(),
            baxis: plainAxis(),
            caxis: plainAxis()
          },
          coloraxis: { colorbar: colorbar() },
          colorscale: {
            sequential: sequentialScale(),
            sequentialminus: sequentialScale(),
            diverging: [
              [0, "#8e0152"],
              [0.1, "#c51b7d"],
              [0.2, "#de77ae"],
              [0.3, "#f1b6da"],
              [0.4, "#fde0ef"],
              [0.5, "#f7f7f7"],
              [0.6, "#e6f5d0"],
              [0.7, "#b8e186"],
              [0.8, "#7fbc41"],
              [0.9, "#4d9221"],
              [1, "#276419"]
            ]
          },
          xaxis: cartesianAxis(),
          yaxis: cartesianAxis(),
          scene: { xaxis: sceneAxis(), yaxis: sceneAxis(), zaxis: sceneAxis() },
          shapedefaults: { line: { color: "#2a3f5f" } },
          annotationdefaults: { arrowcolor: "#2a3f5f", arrowhead: 0, arrowwidth: 1 },
          geo: {
            bgcolor: "white",
            landcolor: "#E5ECF6",
            subunitcolor: "white",
            showland: true,
            showlakes: true,
            lakecolor: "white"
          },
          title: { x: 0.05 },
          mapbox: { style: "light" }
        }
      };

      // -------------------------------------------------------------- layout

      // Subplot heading centred above a panel; `x` is in paper coordinates.
      function panelTitle(text, x) {
        return {
          font: { size: 16 },
          showarrow: false,
          text: text,
          x: x,
          xanchor: "center",
          xref: "paper",
          y: 1,
          yanchor: "bottom",
          yref: "paper"
        };
      }

      // Dashed red horizontal line at y = 80 spanning the full width of one panel.
      // NOTE(review): 80 presumably marks a per-device memory budget in GB -- confirm.
      function referenceLine(axisSuffix) {
        return {
          line: { color: "red", dash: "dash" },
          type: "line",
          x0: 0,
          x1: 1,
          xref: "x" + axisSuffix + " domain",
          y0: 80,
          y1: 80,
          yref: "y" + axisSuffix
        };
      }

      var layout = {
        template: template,
        xaxis: { anchor: "y", domain: [0, 0.2888888888888889] },
        // All three y axes are pinned to 0..150; stacks taller than that (the
        // 70B panel) extend past the top of the plot, as in the original figure.
        yaxis: {
          anchor: "x",
          domain: [0, 1],
          range: [0, 150],
          title: { text: "GB memory" }
        },
        xaxis2: { anchor: "y2", domain: [0.35555555555555557, 0.6444444444444445] },
        yaxis2: {
          anchor: "x2",
          domain: [0, 1],
          matches: "y",
          showticklabels: false,
          range: [0, 150]
        },
        xaxis3: { anchor: "y3", domain: [0.7111111111111111, 1] },
        yaxis3: {
          anchor: "x3",
          domain: [0, 1],
          matches: "y",
          showticklabels: false,
          range: [0, 150]
        },
        annotations: [
          panelTitle("1B model", 0.14444444444444446),
          panelTitle("8B model", 0.5),
          panelTitle("70B model", 0.8555555555555556)
        ],
        shapes: [referenceLine(""), referenceLine("2"), referenceLine("3")],
        title: { text: "Memory Usage vs Sequence Length for Different Model Sizes" },
        legend: { orientation: "v", x: 1.02, y: 0.5 },
        margin: { r: 150 },
        barmode: "stack",
        width: 1000,
        height: 410
      };

      Plotly.newPlot(GRAPH_ID, traces, layout, { responsive: true });
    })();
  </script>
</div> |