Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -12,12 +12,12 @@ def plot_forecast(num_param, batch_size, precision, seq_len):
|
|
12 |
# Model Parameters: N×precision
|
13 |
y1 = num_param * precision / (1024**3)
|
14 |
|
15 |
-
# Optimizer States: 2×N×precision
|
16 |
-
y2 = 2 * num_param * precision / (1024**3)
|
17 |
-
|
18 |
# Activations: B×Sequence Length×K×precision
|
19 |
K = 4.6894e-04 * num_param + 1.8494e06
|
20 |
-
y3 = batch_size * seq_len * K * precision / (1024**3)
|
|
|
|
|
|
|
21 |
|
22 |
# Gradients: N×precision
|
23 |
y4 = num_param * 4 / (1024**3)
|
@@ -33,8 +33,8 @@ def plot_forecast(num_param, batch_size, precision, seq_len):
|
|
33 |
|
34 |
# Add text labels inside the bars
|
35 |
ax.text(0, y1 / 2, "Model Parameters", ha="center", va="center", color="white", fontweight="bold")
|
36 |
-
ax.text(0, y1 + y2 / 2, "Optimizer States", ha="center", va="center", color="white", fontweight="bold")
|
37 |
-
ax.text(0, y1 + y2 + y3 / 2, "Activations", ha="center", va="center", color="white", fontweight="bold")
|
38 |
ax.text(0, y1 + y2 + y3 + y4 / 2, "Gradients", ha="center", va="center", color="white", fontweight="bold")
|
39 |
|
40 |
# remove x axis
|
|
|
12 |
# Model Parameters: N×precision
|
13 |
y1 = num_param * precision / (1024**3)
|
14 |
|
|
|
|
|
|
|
15 |
# Activations: B×Sequence Length×K×precision
|
16 |
K = 4.6894e-04 * num_param + 1.8494e06
|
17 |
+
y2 = batch_size * seq_len * K * precision / (1024**3)
|
18 |
+
|
19 |
+
# Optimizer States: 2×N×precision
|
20 |
+
y3 = 2 * num_param * precision / (1024**3)
|
21 |
|
22 |
# Gradients: N×precision
|
23 |
y4 = num_param * 4 / (1024**3)
|
|
|
33 |
|
34 |
# Add text labels inside the bars
|
35 |
ax.text(0, y1 / 2, "Model Parameters", ha="center", va="center", color="white", fontweight="bold")
|
36 |
+
ax.text(0, y1 + y2 / 2,"Activations", ha="center", va="center", color="white", fontweight="bold")
|
37 |
+
ax.text(0, y1 + y2 + y3 / 2, "Optimizer States", ha="center", va="center", color="white", fontweight="bold")
|
38 |
ax.text(0, y1 + y2 + y3 + y4 / 2, "Gradients", ha="center", va="center", color="white", fontweight="bold")
|
39 |
|
40 |
# remove x axis
|