qgallouedec HF staff committed on
Commit
db805e9
·
verified ·
1 Parent(s): c98b4d9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -12,12 +12,12 @@ def plot_forecast(num_param, batch_size, precision, seq_len):
12
  # Model Parameters: N×precision
13
  y1 = num_param * precision / (1024**3)
14
 
15
- # Optimizer States: 2×N×precision
16
- y2 = 2 * num_param * precision / (1024**3)
17
-
18
  # Activations: B×Sequence Length×K×precision
19
  K = 4.6894e-04 * num_param + 1.8494e06
20
- y3 = batch_size * seq_len * K * precision / (1024**3)
 
 
 
21
 
22
  # Gradients: N×precision
23
  y4 = num_param * 4 / (1024**3)
@@ -33,8 +33,8 @@ def plot_forecast(num_param, batch_size, precision, seq_len):
33
 
34
  # Add text labels inside the bars
35
  ax.text(0, y1 / 2, "Model Parameters", ha="center", va="center", color="white", fontweight="bold")
36
- ax.text(0, y1 + y2 / 2, "Optimizer States", ha="center", va="center", color="white", fontweight="bold")
37
- ax.text(0, y1 + y2 + y3 / 2, "Activations", ha="center", va="center", color="white", fontweight="bold")
38
  ax.text(0, y1 + y2 + y3 + y4 / 2, "Gradients", ha="center", va="center", color="white", fontweight="bold")
39
 
40
  # remove x axis
 
12
  # Model Parameters: N×precision
13
  y1 = num_param * precision / (1024**3)
14
 
 
 
 
15
  # Activations: B×Sequence Length×K×precision
16
  K = 4.6894e-04 * num_param + 1.8494e06
17
+ y2 = batch_size * seq_len * K * precision / (1024**3)
18
+
19
+ # Optimizer States: 2×N×precision
20
+ y3 = 2 * num_param * precision / (1024**3)
21
 
22
  # Gradients: N×precision
23
  y4 = num_param * 4 / (1024**3)
 
33
 
34
  # Add text labels inside the bars
35
  ax.text(0, y1 / 2, "Model Parameters", ha="center", va="center", color="white", fontweight="bold")
36
+ ax.text(0, y1 + y2 / 2,"Activations", ha="center", va="center", color="white", fontweight="bold")
37
+ ax.text(0, y1 + y2 + y3 / 2, "Optimizer States", ha="center", va="center", color="white", fontweight="bold")
38
  ax.text(0, y1 + y2 + y3 + y4 / 2, "Gradients", ha="center", va="center", color="white", fontweight="bold")
39
 
40
  # remove x axis