ultrascale-playbook / dist /fragments /tp_sp_memoryusage.html
hynky's picture
hynky HF staff
add dist + nits
1fa3117
raw
history blame
10.2 kB
<div> <div id=16242941-9fab-40ed-996e-ddd93a5a627c class=plotly-graph-div style="height:410px; width:1000px;"></div> <script>window.PLOTLYENV=window.PLOTLYENV||{},document.getElementById("16242941-9fab-40ed-996e-ddd93a5a627c")&&Plotly.newPlot("16242941-9fab-40ed-996e-ddd93a5a627c",[{legendgroup:"Model Parameters",marker:{color:"#4ea5b7"},name:"Model Parameters",showlegend:!0,x:["1024","4096","16384"],y:[131.5,131.5,131.5],type:"bar",xaxis:"x",yaxis:"y"},{legendgroup:"Model Parameters",marker:{color:"#4ea5b7"},name:"Model Parameters",showlegend:!1,x:["1024","4096","16384"],y:[16.4375,16.4375,16.4375],type:"bar",xaxis:"x2",yaxis:"y2"},{legendgroup:"Model Parameters",marker:{color:"#4ea5b7"},name:"Model Parameters",showlegend:!1,x:["1024","4096","16384"],y:[8.21875,8.21875,8.21875],type:"bar",xaxis:"x3",yaxis:"y3"},{legendgroup:"Gradients",marker:{color:"#e889ab"},name:"Gradients",showlegend:!0,x:["1024","4096","16384"],y:[131.5,131.5,131.5],type:"bar",xaxis:"x",yaxis:"y"},{legendgroup:"Gradients",marker:{color:"#e889ab"},name:"Gradients",showlegend:!1,x:["1024","4096","16384"],y:[16.4375,16.4375,16.4375],type:"bar",xaxis:"x2",yaxis:"y2"},{legendgroup:"Gradients",marker:{color:"#e889ab"},name:"Gradients",showlegend:!1,x:["1024","4096","16384"],y:[8.21875,8.21875,8.21875],type:"bar",xaxis:"x3",yaxis:"y3"},{legendgroup:"Optimizer States",marker:{color:"#cec0fa"},name:"Optimizer States",showlegend:!0,x:["1024","4096","16384"],y:[526,526,526],type:"bar",xaxis:"x",yaxis:"y"},{legendgroup:"Optimizer States",marker:{color:"#cec0fa"},name:"Optimizer States",showlegend:!1,x:["1024","4096","16384"],y:[65.75,65.75,65.75],type:"bar",xaxis:"x2",yaxis:"y2"},{legendgroup:"Optimizer States",marker:{color:"#cec0fa"},name:"Optimizer States",showlegend:!1,x:["1024","4096","16384"],y:[32.875,32.875,32.875],type:"bar",xaxis:"x3",yaxis:"y3"},{legendgroup:"Activations",marker:{color:"#e38a42"},name:"Activations",showlegend:!0,x:["1024","4096","16384"],y:[21.25,85,340],type:"bar",xaxis:"x",yaxis:"y"},{legendgroup:"Activations",marker:{color:"#e38a42"},name:"Activations",showlegend:!1,x:["1024","4096","16384"],y:[2.65625,10.625,42.5],type:"bar",xaxis:"x2",yaxis:"y2"},{legendgroup:"Activations",marker:{color:"#e38a42"},name:"Activations",showlegend:!1,x:["1024","4096","16384"],y:[1.328125,5.3125,21.25],type:"bar",xaxis:"x3",yaxis:"y3"}],{template:{data:{histogram2dcontour:[{type:"histogram2dcontour",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],choropleth:[{type:"choropleth",colorbar:{outlinewidth:0,ticks:""}}],histogram2d:[{type:"histogram2d",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],heatmap:[{type:"heatmap",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],heatmapgl:[{type:"heatmapgl",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],contourcarpet:[{type:"contourcarpet",colorbar:{outlinewidth:0,ticks:""}}],contour:[{type:"contour",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],surface:[{type:"surface",colorbar:{outlinewidth:0,ticks:""},colorscale:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]]}],mesh3d:[{type:"mesh3d",colorbar:{outlinewidth:0,ticks:""}}],scatter:[{fillpattern:{fillmode:"overlay",size:10,solidity:.2},type:"scatter"}],parcoords:[{type:"parcoords",line:{colorbar:{outlinewidth:0,ticks:""}}}],scatterpolargl:[{type:"scatterpolargl",marker:{colorbar:{outlinewidth:0,ticks:""}}}],bar:[{error_x:{color:"#2a3f5f"},error_y:{color:"#2a3f5f"},marker:{line:{color:"#E5ECF6",width:.5},pattern:{fillmode:"overlay",size:10,solidity:.2}},type:"bar"}],scattergeo:[{type:"scattergeo",marker:{colorbar:{outlinewidth:0,ticks:""}}}],scatterpolar:[{type:"scatterpolar",marker:{colorbar:{outlinewidth:0,ticks:""}}}],histogram:[{marker:{pattern:{fillmode:"overlay",size:10,solidity:.2}},type:"histogram"}],scattergl:[{type:"scattergl",marker:{colorbar:{outlinewidth:0,ticks:""}}}],scatter3d:[{type:"scatter3d",line:{colorbar:{outlinewidth:0,ticks:""}},marker:{colorbar:{outlinewidth:0,ticks:""}}}],scattermapbox:[{type:"scattermapbox",marker:{colorbar:{outlinewidth:0,ticks:""}}}],scatterternary:[{type:"scatterternary",marker:{colorbar:{outlinewidth:0,ticks:""}}}],scattercarpet:[{type:"scattercarpet",marker:{colorbar:{outlinewidth:0,ticks:""}}}],carpet:[{aaxis:{endlinecolor:"#2a3f5f",gridcolor:"white",linecolor:"white",minorgridcolor:"white",startlinecolor:"#2a3f5f"},baxis:{endlinecolor:"#2a3f5f",gridcolor:"white",linecolor:"white",minorgridcolor:"white",startlinecolor:"#2a3f5f"},type:"carpet"}],table:[{cells:{fill:{color:"#EBF0F8"},line:{color:"white"}},header:{fill:{color:"#C8D4E3"},line:{color:"white"}},type:"table"}],barpolar:[{marker:{line:{color:"#E5ECF6",width:.5},pattern:{fillmode:"overlay",size:10,solidity:.2}},type:"barpolar"}],pie:[{automargin:!0,type:"pie"}]},layout:{autotypenumbers:"strict",colorway:["#636efa","#EF553B","#00cc96","#ab63fa","#FFA15A","#19d3f3","#FF6692","#B6E880","#FF97FF","#FECB52"],font:{color:"#2a3f5f"},hovermode:"closest",hoverlabel:{align:"left"},paper_bgcolor:"white",plot_bgcolor:"#E5ECF6",polar:{bgcolor:"#E5ECF6",angularaxis:{gridcolor:"white",linecolor:"white",ticks:""},radialaxis:{gridcolor:"white",linecolor:"white",ticks:""}},ternary:{bgcolor:"#E5ECF6",aaxis:{gridcolor:"white",linecolor:"white",ticks:""},baxis:{gridcolor:"white",linecolor:"white",ticks:""},caxis:{gridcolor:"white",linecolor:"white",ticks:""}},coloraxis:{colorbar:{outlinewidth:0,ticks:""}},colorscale:{sequential:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]],sequentialminus:[[0,"#0d0887"],[.1111111111111111,"#46039f"],[.2222222222222222,"#7201a8"],[.3333333333333333,"#9c179e"],[.4444444444444444,"#bd3786"],[.5555555555555556,"#d8576b"],[.6666666666666666,"#ed7953"],[.7777777777777778,"#fb9f3a"],[.8888888888888888,"#fdca26"],[1,"#f0f921"]],diverging:[[0,"#8e0152"],[.1,"#c51b7d"],[.2,"#de77ae"],[.3,"#f1b6da"],[.4,"#fde0ef"],[.5,"#f7f7f7"],[.6,"#e6f5d0"],[.7,"#b8e186"],[.8,"#7fbc41"],[.9,"#4d9221"],[1,"#276419"]]},xaxis:{gridcolor:"white",linecolor:"white",ticks:"",title:{standoff:15},zerolinecolor:"white",automargin:!0,zerolinewidth:2},yaxis:{gridcolor:"white",linecolor:"white",ticks:"",title:{standoff:15},zerolinecolor:"white",automargin:!0,zerolinewidth:2},scene:{xaxis:{backgroundcolor:"#E5ECF6",gridcolor:"white",linecolor:"white",showbackground:!0,ticks:"",zerolinecolor:"white",gridwidth:2},yaxis:{backgroundcolor:"#E5ECF6",gridcolor:"white",linecolor:"white",showbackground:!0,ticks:"",zerolinecolor:"white",gridwidth:2},zaxis:{backgroundcolor:"#E5ECF6",gridcolor:"white",linecolor:"white",showbackground:!0,ticks:"",zerolinecolor:"white",gridwidth:2}},shapedefaults:{line:{color:"#2a3f5f"}},annotationdefaults:{arrowcolor:"#2a3f5f",arrowhead:0,arrowwidth:1},geo:{bgcolor:"white",landcolor:"#E5ECF6",subunitcolor:"white",showland:!0,showlakes:!0,lakecolor:"white"},title:{x:.05},mapbox:{style:"light"}}},xaxis:{anchor:"y",domain:[0,.2888888888888889],title:{text:"Sequence Length"},showgrid:!0,gridcolor:"LightGray"},yaxis:{anchor:"x",domain:[0,1],range:[0,150],dtick:20,showgrid:!0,gridcolor:"LightGray",title:{text:"Memory Usage (GB)"}},xaxis2:{anchor:"y2",domain:[.35555555555555557,.6444444444444445],title:{text:"Sequence Length"},showgrid:!0,gridcolor:"LightGray"},yaxis2:{anchor:"x2",domain:[0,1],matches:"y",showticklabels:!1,range:[0,150],dtick:20,showgrid:!0,gridcolor:"LightGray"},xaxis3:{anchor:"y3",domain:[.7111111111111111,1],title:{text:"Sequence Length"},showgrid:!0,gridcolor:"LightGray"},yaxis3:{anchor:"x3",domain:[0,1],matches:"y",showticklabels:!1,range:[0,150],dtick:20,showgrid:!0,gridcolor:"LightGray"},annotations:[{font:{size:16},showarrow:!1,text:"No Parallelism",x:.14444444444444446,xanchor:"center",xref:"paper",y:1,yanchor:"bottom",yref:"paper"},{font:{size:16},showarrow:!1,text:"TP=8 (with SP)",x:.5,xanchor:"center",xref:"paper",y:1,yanchor:"bottom",yref:"paper"},{font:{size:16},showarrow:!1,text:"TP=16 (with SP)",x:.8555555555555556,xanchor:"center",xref:"paper",y:1,yanchor:"bottom",yref:"paper"}],shapes:[{line:{color:"red",dash:"dash"},type:"line",x0:0,x1:1,xref:"x domain",y0:80,y1:80,yref:"y"},{line:{color:"red",dash:"dash"},type:"line",x0:0,x1:1,xref:"x2 domain",y0:80,y1:80,yref:"y2"},{line:{color:"red",dash:"dash"},type:"line",x0:0,x1:1,xref:"x3 domain",y0:80,y1:80,yref:"y3"}],title:{text:"Memory Usage for 70B Model"},legend:{orientation:"v",x:1.02,y:.5},margin:{r:150},barmode:"stack",width:1e3,height:410},{responsive:!0})</script> </div>