update formula and default input
Browse files
app.py
CHANGED
@@ -359,8 +359,8 @@ formula = r"""
|
|
359 |
|
360 |
$$
|
361 |
{Model\ states} =
|
362 |
-
(6 + \frac{12}{dp}) \times
|
363 |
-
(\frac{(\frac{
|
364 |
$$
|
365 |
|
366 |
$$
|
@@ -505,7 +505,7 @@ with gr.Blocks() as demo:
|
|
505 |
)
|
506 |
with gr.Accordion("Parallelism config"):
|
507 |
# with gr.Row():
|
508 |
-
dp = gr.Number(label="Data parallelism", value=
|
509 |
tp = gr.Number(label="Tensor parallelism", value=2)
|
510 |
pp = gr.Number(label="Pipeline parallelism", value=2)
|
511 |
cp = gr.Number(label="Context parallelism", value=2)
|
@@ -580,4 +580,4 @@ with gr.Blocks() as demo:
|
|
580 |
|
581 |
|
582 |
if __name__ == "__main__":
|
583 |
-
demo.launch(allowed_paths=["/"])
|
|
|
359 |
|
360 |
$$
|
361 |
{Model\ states} =
|
362 |
+
(6 + \frac{12}{dp \times cp}) \times
|
363 |
+
(\frac{(\frac{4H^2 + 3H \times FFN}{tp} + 2H) \times L}{pp} + \frac{HV}{tp} + HS)
|
364 |
$$
|
365 |
|
366 |
$$
|
|
|
505 |
)
|
506 |
with gr.Accordion("Parallelism config"):
|
507 |
# with gr.Row():
|
508 |
+
dp = gr.Number(label="Data parallelism", value=2)
|
509 |
tp = gr.Number(label="Tensor parallelism", value=2)
|
510 |
pp = gr.Number(label="Pipeline parallelism", value=2)
|
511 |
cp = gr.Number(label="Context parallelism", value=2)
|
|
|
580 |
|
581 |
|
582 |
if __name__ == "__main__":
|
583 |
+
demo.launch(share=False, allowed_paths=["/"])
|