shchuro commited on
Commit
732efe6
·
1 Parent(s): d4a7fd1

Update app

Browse files
Files changed (1) hide show
  1. app.py +15 -3
app.py CHANGED
@@ -8,7 +8,11 @@ df = pd.read_csv(
8
  )
9
 
10
  markdown_text = """
11
- Hello world
 
 
 
 
12
  """
13
 
14
  summary_urls = [
@@ -54,13 +58,21 @@ lb_wql = (
54
 
55
  with gr.Blocks() as demo:
56
  with gr.Tab("Leaderboard"):
57
- gr.Markdown("## Point forecast accuracy (measured by MASE)")
 
 
 
 
 
 
 
 
58
  gr.Dataframe(
59
  value=lb_mase,
60
  interactive=False,
61
  )
62
 
63
- gr.Markdown("## Probabilistic forecast accuracy (measured by WQL)")
64
  gr.Dataframe(
65
  value=lb_wql,
66
  interactive=False,
 
8
  )
9
 
10
  markdown_text = """
11
+ This space hosts evaluation results for time series forecasting models.
12
+
13
+ Benchmark definitions, implementations of models, as well as the evaluation results for individual tasks are available under https://github.com/autogluon/fev.
14
+
15
+ Currently, the results in this space are a minimal proof of concept. Stay tuned for more benchmarks, results for new models and instructions on how to contribute your results.
16
  """
17
 
18
  summary_urls = [
 
58
 
59
  with gr.Blocks() as demo:
60
  with gr.Tab("Leaderboard"):
61
+ gr.Markdown("""
62
+ ## Chronos zero-shot benchmark results
63
+
64
+ This tab contains results for various forecasting models on the 28 datasets used in Benchmark II (zero-shot evaluation) in the publication [Chronos: Learning the Language of Time Series](https://arxiv.org/abs/2403.07815).
65
+
66
+ Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/chronos_zeroshot).
67
+ """)
68
+ gr.Markdown("""### Point forecast accuracy (measured by MASE)
69
+ """)
70
  gr.Dataframe(
71
  value=lb_mase,
72
  interactive=False,
73
  )
74
 
75
+ gr.Markdown("### Probabilistic forecast accuracy (measured by WQL)")
76
  gr.Dataframe(
77
  value=lb_wql,
78
  interactive=False,