Spaces:
Running
Running
Update app
Browse files
app.py
CHANGED
|
@@ -8,7 +8,11 @@ df = pd.read_csv(
|
|
| 8 |
)
|
| 9 |
|
| 10 |
markdown_text = """
|
| 11 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
"""
|
| 13 |
|
| 14 |
summary_urls = [
|
|
@@ -54,13 +58,21 @@ lb_wql = (
|
|
| 54 |
|
| 55 |
with gr.Blocks() as demo:
|
| 56 |
with gr.Tab("Leaderboard"):
|
| 57 |
-
gr.Markdown("
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 58 |
gr.Dataframe(
|
| 59 |
value=lb_mase,
|
| 60 |
interactive=False,
|
| 61 |
)
|
| 62 |
|
| 63 |
-
gr.Markdown("
|
| 64 |
gr.Dataframe(
|
| 65 |
value=lb_wql,
|
| 66 |
interactive=False,
|
|
|
|
| 8 |
)
|
| 9 |
|
| 10 |
markdown_text = """
|
| 11 |
+
This space hosts evaluation results for time series forecasting models.
|
| 12 |
+
|
| 13 |
+
Benchmark definitions, implementations of models, as well as the evaluation results for individual tasks are available under https://github.com/autogluon/fev.
|
| 14 |
+
|
| 15 |
+
Currently, the results in this space are a minimal proof of concept. Stay tuned for more benchmarks, results for new models and instructions on how to contribute your results.
|
| 16 |
"""
|
| 17 |
|
| 18 |
summary_urls = [
|
|
|
|
| 58 |
|
| 59 |
with gr.Blocks() as demo:
|
| 60 |
with gr.Tab("Leaderboard"):
|
| 61 |
+
gr.Markdown("""
|
| 62 |
+
## Chronos zero-shot benchmark results
|
| 63 |
+
|
| 64 |
+
This tab contains results for various forecasting models on the 28 datasets used in Benchmark II (zero-shot evaluation) in the publication [Chronos: Learning the Language of Time Series](https://arxiv.org/abs/2403.07815).
|
| 65 |
+
|
| 66 |
+
Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/chronos_zeroshot).
|
| 67 |
+
""")
|
| 68 |
+
gr.Markdown("""### Point forecast accuracy (measured by MASE)
|
| 69 |
+
""")
|
| 70 |
gr.Dataframe(
|
| 71 |
value=lb_mase,
|
| 72 |
interactive=False,
|
| 73 |
)
|
| 74 |
|
| 75 |
+
gr.Markdown("### Probabilistic forecast accuracy (measured by WQL)")
|
| 76 |
gr.Dataframe(
|
| 77 |
value=lb_wql,
|
| 78 |
interactive=False,
|