Jack Monas
committed on
Commit
·
254ddce
1
Parent(s):
b3e6d70
rules
Browse files
app.py
CHANGED
@@ -2,125 +2,113 @@ import streamlit as st
|
|
2 |
import pandas as pd
|
3 |
import streamlit.components.v1 as components
|
4 |
|
5 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
st.title("World Model Challenge")
|
7 |
-
st.
|
8 |
st.write(
|
9 |
-
"Welcome to the World Model Challenge server. This platform hosts three challenges "
|
10 |
-
"
|
11 |
)
|
12 |
|
13 |
-
|
14 |
-
|
15 |
-
st.
|
16 |
st.write(
|
17 |
-
"Real-world robotics faces a
|
18 |
-
"
|
19 |
-
"learning to simulate complex real-world interactions from raw sensor data. We believe these learned simulators will enable "
|
20 |
-
"robust evaluation and iterative improvement of robot policies without the constraints of a physical testbed."
|
21 |
)
|
22 |
|
23 |
-
|
24 |
-
|
25 |
-
st.
|
26 |
-
|
|
|
27 |
st.write(
|
28 |
-
"
|
|
|
29 |
)
|
30 |
-
|
|
|
31 |
st.write(
|
32 |
-
"In the Sampling Challenge,
|
|
|
33 |
)
|
34 |
-
|
|
|
35 |
st.write(
|
36 |
-
"
|
|
|
|
|
37 |
)
|
38 |
|
39 |
-
|
40 |
-
|
41 |
-
st.
|
42 |
st.write(
|
43 |
-
"We offer two key datasets
|
44 |
-
"**Raw Data:** The [world_model_raw_data](https://huggingface.co/datasets/1x-technologies/world_model_raw_data) dataset "
|
45 |
-
"
|
46 |
-
"
|
47 |
-
"and is
|
48 |
-
"**Tokenized Data:** The [world_model_tokenized_data](https://huggingface.co/datasets/1x-technologies/world_model_tokenized_data) dataset "
|
49 |
-
"tokenizes the raw video sequences generated using the NVIDIA Cosmos Tokenizer. This compact representation of the raw data "
|
50 |
-
"is optimal for the Compression Challenge and is released under the Apache 2.0 license.\n\n"
|
51 |
)
|
52 |
|
53 |
-
|
54 |
-
|
55 |
-
st.
|
56 |
st.write(
|
57 |
"Our scoring system rewards performance in all three challenges, with extra emphasis on the Evaluation Challenge. "
|
58 |
-
"A team's final rank is
|
59 |
)
|
60 |
-
|
|
|
61 |
col1, col2, col3 = st.columns(3)
|
62 |
|
63 |
with col1:
|
64 |
st.markdown('<h3 style="margin-left:20px;">Compression</h3>', unsafe_allow_html=True)
|
65 |
st.markdown(
|
66 |
"""
|
67 |
-
- **1st Place
|
68 |
-
- **2nd Place
|
69 |
-
- **3rd Place
|
70 |
"""
|
71 |
)
|
72 |
-
|
73 |
with col2:
|
74 |
st.markdown('<h3 style="margin-left:20px;">Sampling</h3>', unsafe_allow_html=True)
|
75 |
st.markdown(
|
76 |
"""
|
77 |
-
- **1st Place
|
78 |
-
- **2nd Place
|
79 |
-
- **3rd Place
|
80 |
"""
|
81 |
)
|
82 |
-
|
83 |
with col3:
|
84 |
st.markdown('<h3 style="margin-left:20px;">Evaluation</h3>', unsafe_allow_html=True)
|
85 |
st.markdown(
|
86 |
"""
|
87 |
-
- **1st Place
|
88 |
-
- **2nd Place
|
89 |
-
- **3rd Place
|
90 |
"""
|
91 |
)
|
|
|
92 |
with st.expander("Tie-Breakers"):
|
93 |
st.write(
|
94 |
-
"The overall winner will be the team with the highest total points. "
|
95 |
"In the event of a tie, the following tie-breakers will be applied in order:\n\n"
|
96 |
"1. Highest Evaluation Challenge score\n"
|
97 |
"2. Highest Sampling Challenge score\n"
|
98 |
-
"3. Highest Compression Challenge score
|
99 |
)
|
|
|
100 |
st.write(
|
101 |
-
"The leaderboard, which shows the total points across all challenges, will go live on **March 10th**. "
|
102 |
-
"
|
103 |
-
"respective Hugging Face submission servers."
|
104 |
)
|
105 |
-
|
106 |
-
def main():
|
107 |
-
st.set_page_config(page_title="World Model Challenge")
|
108 |
-
|
109 |
-
# Sidebar navigation
|
110 |
-
st.sidebar.title("Navigation")
|
111 |
-
section = st.sidebar.radio("Jump to Section",
|
112 |
-
["Overview", "Motivation", "Challenges", "Datasets", "Scoring"])
|
113 |
-
|
114 |
-
if section == "Overview":
|
115 |
-
overview_section()
|
116 |
-
elif section == "Motivation":
|
117 |
-
motivation_section()
|
118 |
-
elif section == "Challenges":
|
119 |
-
challenges_section()
|
120 |
-
elif section == "Datasets":
|
121 |
-
datasets_section()
|
122 |
-
elif section == "Scoring":
|
123 |
-
scoring_section()
|
124 |
-
|
125 |
-
if __name__ == '__main__':
|
126 |
-
main()
|
|
|
2 |
import pandas as pd
|
3 |
import streamlit.components.v1 as components
|
4 |
|
5 |
+
# Set up page configuration
|
6 |
+
st.set_page_config(page_title="World Model Challenge", layout="wide")
|
7 |
+
|
8 |
+
# Sidebar Navigation
|
9 |
+
st.sidebar.title("Navigation")
|
10 |
+
section = st.sidebar.radio("Jump to Section",
|
11 |
+
["Overview", "Motivation", "Challenges", "Datasets", "Scoring"])
|
12 |
+
|
13 |
+
# Overview Section
|
14 |
+
if section == "Overview":
|
15 |
st.title("World Model Challenge")
|
16 |
+
st.header("Welcome")
|
17 |
st.write(
|
18 |
+
"Welcome to the World Model Challenge server. This platform hosts three challenges designed to advance research in world models for robotics: "
|
19 |
+
"Compression, Sampling, and Evaluation."
|
20 |
)
|
21 |
|
22 |
+
# Motivation Section
|
23 |
+
elif section == "Motivation":
|
24 |
+
st.header("Motivation")
|
25 |
st.write(
|
26 |
+
"Real-world robotics faces a constant challenge—environments are dynamic and ever-changing, which makes it difficult to reliably evaluate robot performance. "
|
27 |
+
"World models address this by learning to simulate complex interactions from raw sensor data. These learned simulators allow for robust testing and continuous improvement of robot policies without the limitations of physical testing."
|
|
|
|
|
28 |
)
|
29 |
|
30 |
+
# Challenges Section
|
31 |
+
elif section == "Challenges":
|
32 |
+
st.header("The Challenges")
|
33 |
+
|
34 |
+
st.subheader("Compression Challenge")
|
35 |
st.write(
|
36 |
+
"Your task is to train a model to compress our robots' logs effectively while preserving critical details needed to understand and predict future interactions. "
|
37 |
+
"Performance is measured by the model's loss—the lower the loss, the better it captures real-world complexities."
|
38 |
)
|
39 |
+
|
40 |
+
st.subheader("Sampling Challenge")
|
41 |
st.write(
|
42 |
+
"In the Sampling Challenge, predict a video frame two seconds ahead given a short clip of robot interactions. "
|
43 |
+
"The goal is to create a coherent and plausible continuation that accurately reflects scene dynamics. Submissions are judged by how closely they match the actual frame."
|
44 |
)
|
45 |
+
|
46 |
+
st.subheader("Evaluation Challenge")
|
47 |
st.write(
|
48 |
+
"This challenge asks: Can you predict a robot's real-world performance without physically deploying it? "
|
49 |
+
"You'll be given several policies for a specific task and must rank them by expected performance. "
|
50 |
+
"Your ranking is then compared to the true ranking of the policies."
|
51 |
)
|
52 |
|
53 |
+
# Datasets Section
|
54 |
+
elif section == "Datasets":
|
55 |
+
st.header("Datasets")
|
56 |
st.write(
|
57 |
+
"We offer two key datasets for the 1X World Model Challenge:\n\n"
|
58 |
+
"**Raw Data:** The [world_model_raw_data](https://huggingface.co/datasets/1x-technologies/world_model_raw_data) dataset provides raw sensor data, video logs, and annotated robot state sequences from diverse real-world scenarios. "
|
59 |
+
"It is split into 100 shards—each containing a 512x512 MP4 video, a segment index mapping, and state arrays—and is licensed under CC-BY-NC-SA 4.0.\n\n"
|
60 |
+
"**Tokenized Data:** The [world_model_tokenized_data](https://huggingface.co/datasets/1x-technologies/world_model_tokenized_data) dataset tokenizes raw video sequences using the NVIDIA Cosmos Tokenizer. "
|
61 |
+
"This compact representation is optimal for the Compression Challenge and is released under the Apache 2.0 license."
|
|
|
|
|
|
|
62 |
)
|
63 |
|
64 |
+
# Scoring Section
|
65 |
+
elif section == "Scoring":
|
66 |
+
st.header("Scoring")
|
67 |
st.write(
|
68 |
"Our scoring system rewards performance in all three challenges, with extra emphasis on the Evaluation Challenge. "
|
69 |
+
"A team's final rank is based on the total points earned across the challenges."
|
70 |
)
|
71 |
+
|
72 |
+
st.subheader("Points Breakdown")
|
73 |
col1, col2, col3 = st.columns(3)
|
74 |
|
75 |
with col1:
|
76 |
st.markdown('<h3 style="margin-left:20px;">Compression</h3>', unsafe_allow_html=True)
|
77 |
st.markdown(
|
78 |
"""
|
79 |
+
- **1st Place:** 10 points
|
80 |
+
- **2nd Place:** 7 points
|
81 |
+
- **3rd Place:** 5 points
|
82 |
"""
|
83 |
)
|
|
|
84 |
with col2:
|
85 |
st.markdown('<h3 style="margin-left:20px;">Sampling</h3>', unsafe_allow_html=True)
|
86 |
st.markdown(
|
87 |
"""
|
88 |
+
- **1st Place:** 10 points
|
89 |
+
- **2nd Place:** 7 points
|
90 |
+
- **3rd Place:** 5 points
|
91 |
"""
|
92 |
)
|
|
|
93 |
with col3:
|
94 |
st.markdown('<h3 style="margin-left:20px;">Evaluation</h3>', unsafe_allow_html=True)
|
95 |
st.markdown(
|
96 |
"""
|
97 |
+
- **1st Place:** 20 points
|
98 |
+
- **2nd Place:** 14 points
|
99 |
+
- **3rd Place:** 10 points
|
100 |
"""
|
101 |
)
|
102 |
+
|
103 |
with st.expander("Tie-Breakers"):
|
104 |
st.write(
|
|
|
105 |
"In the event of a tie, the following tie-breakers will be applied in order:\n\n"
|
106 |
"1. Highest Evaluation Challenge score\n"
|
107 |
"2. Highest Sampling Challenge score\n"
|
108 |
+
"3. Highest Compression Challenge score"
|
109 |
)
|
110 |
+
|
111 |
st.write(
|
112 |
+
"The overall leaderboard, which shows the total points across all challenges, will go live on **March 10th**. "
|
113 |
+
"Each challenge—Compression, Sampling, and Evaluation—will also have its own leaderboard on their respective Hugging Face submission servers."
|
|
|
114 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|