Spaces:
Running
Running
Update app
Browse files
app.py
CHANGED
@@ -8,7 +8,11 @@ df = pd.read_csv(
|
|
8 |
)
|
9 |
|
10 |
markdown_text = """
|
11 |
-
|
|
|
|
|
|
|
|
|
12 |
"""
|
13 |
|
14 |
summary_urls = [
|
@@ -54,13 +58,21 @@ lb_wql = (
|
|
54 |
|
55 |
with gr.Blocks() as demo:
|
56 |
with gr.Tab("Leaderboard"):
|
57 |
-
gr.Markdown("
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
58 |
gr.Dataframe(
|
59 |
value=lb_mase,
|
60 |
interactive=False,
|
61 |
)
|
62 |
|
63 |
-
gr.Markdown("
|
64 |
gr.Dataframe(
|
65 |
value=lb_wql,
|
66 |
interactive=False,
|
|
|
8 |
)
|
9 |
|
10 |
markdown_text = """
|
11 |
+
This space hosts evaluation results for time series forecasting models.
|
12 |
+
|
13 |
+
Benchmark definitions, implementations of models, as well as the evaluation results for individual tasks are available under https://github.com/autogluon/fev.
|
14 |
+
|
15 |
+
Currently, the results in this space are a minimal proof of concept. Stay tuned for more benchmarks, results for new models and instructions on how to contribute your results.
|
16 |
"""
|
17 |
|
18 |
summary_urls = [
|
|
|
58 |
|
59 |
with gr.Blocks() as demo:
|
60 |
with gr.Tab("Leaderboard"):
|
61 |
+
gr.Markdown("""
|
62 |
+
## Chronos zero-shot benchmark results
|
63 |
+
|
64 |
+
This tab contains results for various forecasting models on the 28 datasets used in Benchmark II (zero-shot evaluation) in the publication [Chronos: Learning the Language of Time Series](https://arxiv.org/abs/2403.07815).
|
65 |
+
|
66 |
+
Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/chronos_zeroshot).
|
67 |
+
""")
|
68 |
+
gr.Markdown("""### Point forecast accuracy (measured by MASE)
|
69 |
+
""")
|
70 |
gr.Dataframe(
|
71 |
value=lb_mase,
|
72 |
interactive=False,
|
73 |
)
|
74 |
|
75 |
+
gr.Markdown("### Probabilistic forecast accuracy (measured by WQL)")
|
76 |
gr.Dataframe(
|
77 |
value=lb_wql,
|
78 |
interactive=False,
|