madmax3366 committed on
Commit
2a9cc3f
·
verified ·
1 Parent(s): 9b4a15e

Update index.html

Browse files
Files changed (1) hide show
  1. index.html +207 -187
index.html CHANGED
@@ -1,217 +1,237 @@
1
  <!DOCTYPE html>
2
- <html lang="en">
3
  <head>
4
- <meta charset="utf-8" />
5
- <meta name="viewport" content="width=device-width, initial-scale=1" />
 
 
 
6
  <title>AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems</title>
7
- <meta name="description" content="AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems" />
8
 
9
- <link rel="preconnect" href="https://fonts.googleapis.com">
10
- <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
11
- <link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap" rel="stylesheet">
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
 
13
  <style>
14
- :root{
15
- --page-w: 1100px;
16
- --fg: #0b0b0b;
17
- --bg: #ffffff;
18
- --muted: #555;
19
- --border: #e7e7ea;
20
- --accent: #111;
21
- --accent-weak: rgba(0,0,0,.08);
22
- --shadow: 0 1px 2px rgba(0,0,0,.05), 0 6px 22px rgba(0,0,0,.06);
23
- --radius: 12px;
24
- }
25
- *{box-sizing:border-box}
26
- html,body{margin:0;padding:0;background:var(--bg);color:var(--fg);font-family:Inter,system-ui,-apple-system,Segoe UI,Roboto,Helvetica,Arial}
27
- a{color:var(--accent);text-decoration:none;border-bottom:1px solid var(--accent-weak)}
28
- a:hover{border-bottom-color:rgba(0,0,0,.28)}
29
- .container{max-width:var(--page-w);margin:0 auto;padding:0 20px}
30
-
31
- /* Minimal top nav (centered like many paper pages) */
32
- .nav{border-bottom:1px solid var(--border);background:#fff}
33
- .nav-inner{display:flex;align-items:center;justify-content:center;gap:20px;height:54px}
34
- .nav a{border-bottom:0;font-weight:600;color:#222}
35
-
36
- /* Hero / header */
37
- header.hero{padding:48px 0 28px;border-bottom:1px solid var(--border)}
38
- h1.title{font-size:clamp(28px,4.2vw,46px);line-height:1.12;margin:0 0 10px;letter-spacing:-0.02em;text-align:center}
39
- .authors,.affils{color:var(--muted);text-align:center}
40
- .authors{margin:6px auto 0;font-size:15px}
41
- .affils{margin:2px auto 0;font-size:14px}
42
- .lead{max-width:900px;margin:14px auto 0;text-align:center;color:var(--muted);font-size:clamp(16px,2vw,18px)}
43
-
44
- /* Link badges (Paper / Code) */
45
- .links{display:flex;gap:12px;justify-content:center;margin-top:18px}
46
- .badge{display:inline-flex;align-items:center;gap:8px;padding:10px 14px;border:1px solid var(--border);border-radius:999px;background:#fff;box-shadow:var(--shadow);font-size:14px}
47
- .badge span.icon{font-weight:700;font-size:14px}
48
-
49
- /* Sections in paper style */
50
- section{padding:34px 0;border-bottom:1px solid var(--border)}
51
- section:last-of-type{border-bottom:0}
52
- h2{font-size:22px;margin:0 0 14px}
53
- p{margin:10px 0}
54
-
55
- /* Figure (image above video) with zoom */
56
- .figure{margin-top:6px}
57
- .figure img{
58
- width:100%;height:auto;display:block;
59
- max-height:72vh;object-fit:contain;
60
- border:1px solid var(--border);border-radius:var(--radius);
61
- background:#fff;
62
- }
63
- .caption{font-size:14px;color:var(--muted);text-align:center;margin-top:8px}
64
-
65
- /* CSS-only lightbox */
66
- .lightbox{position:fixed;inset:0;display:none;align-items:center;justify-content:center;background:rgba(0,0,0,.92);padding:24px;z-index:999}
67
- .lightbox:target{display:flex}
68
- .lightbox img{max-width:96vw;max-height:96vh}
69
-
70
- /* Video */
71
- .video video, .video iframe{width:100%;height:auto;display:block;border-radius:var(--radius);background:#000;border:1px solid var(--border)}
72
-
73
- /* Grid for “Tasks (preview)” */
74
- .grid{display:grid;gap:18px}
75
- @media (min-width: 880px){ .grid.two{grid-template-columns:1fr 1fr} }
76
-
77
- /* Code block (BibTeX) */
78
- pre{background:#fafafa;border:1px solid var(--border);border-radius:10px;padding:14px;overflow:auto}
79
- code{font-family:ui-monospace,SFMono-Regular,Menlo,Consolas,monospace;font-size:13px}
80
-
81
- /* Footer */
82
- footer{padding:26px 0;color:var(--muted);text-align:center;font-size:14px}
83
  </style>
84
  </head>
85
-
86
  <body>
87
- <!-- minimal top nav (optional) -->
88
- <nav class="nav">
89
- <div class="container nav-inner">
90
- <a href="#">AUTOMOTIVE-ENV</a>
91
- <a href="https://arxiv.org/abs/2509.21143" target="_blank" rel="noopener">Paper</a>
92
- <a href="#" target="_blank" rel="noopener">Code</a>
93
- </div>
94
- </nav>
95
-
96
- <!-- hero -->
97
- <header class="hero">
98
- <div class="container">
99
- <h1 class="title">AUTOMOTIVE-ENV: BENCHMARKING MULTIMODAL AGENTS IN VEHICLE INTERFACE SYSTEMS</h1>
100
-
101
- <div class="authors">
102
- <strong>Junfeng Yan</strong><sup>*1</sup>,
103
- <strong>Biao Wu</strong><sup>*1</sup>,
104
- <strong>Meng Fang</strong><sup>2</sup>,
105
- <strong>Ling Chen</strong><sup>1</sup>
106
- </div>
107
- <div class="affils">
108
- <sup>1</sup>Australian Artificial Intelligence Institute, Sydney, Australia &nbsp;&nbsp;|&nbsp;&nbsp;
109
- <sup>2</sup>University of Liverpool, Liverpool, United Kingdom
110
- </div>
111
 
112
- <p class="lead">
113
- Multimodal agents show strong generic GUI skills, but in-vehicle systems impose unique constraints: limited driver attention, strict safety, and location-aware interaction. <em>Automotive-ENV</em> is a high-fidelity benchmark for vehicle GUIs with 185 parameterized tasks and reproducible checks. We further propose <em>ASURADA</em>, a geo-aware agent leveraging GPS context for safer decisions.
114
- </p>
115
-
116
- <div class="links">
117
- <a class="badge" href="https://arxiv.org/abs/2509.21143" target="_blank" rel="noopener">
118
- <span class="icon">⧉</span><span>Paper (arXiv)</span>
119
- </a>
120
- <a class="badge" href="#" target="_blank" rel="noopener">
121
- <span class="icon">★</span><span>Code (coming soon)</span>
122
- </a>
123
- </div>
 
 
 
 
124
  </div>
125
- </header>
126
-
127
- <!-- system overview image (click to zoom) -->
128
- <section aria-label="system-overview">
129
- <div class="container">
130
- <h2>System Overview</h2>
131
- <div class="figure">
132
- <!-- Put your image next to index.html as demo_arch.jpg (or change the src) -->
133
- <a href="#fig-arch"><img src="demo_arch.jpg" alt="Automotive-ENV architecture overview"></a>
134
- <p class="caption">Figure 1. Automotive-ENV architecture overview. Click to zoom.</p>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
135
  </div>
136
  </div>
137
- </section>
138
-
139
- <!-- teaser / demo video -->
140
- <section aria-label="demo">
141
- <div class="container">
142
- <h2>Demo</h2>
143
- <!-- Place demo.mp4 next to this index.html -->
144
- <div class="video">
145
- <video src="demo.mp4" autoplay muted loop playsinline controls></video>
 
 
 
 
146
  </div>
147
  </div>
148
- </section>
149
-
150
- <!-- abstract -->
151
- <section aria-label="abstract">
152
- <div class="container">
153
- <h2>Abstract</h2>
154
- <p>
155
- In-vehicle GUIs present distinct challenges: drivers’ limited attention, strict safety requirements, and
156
- complex location-based interaction patterns. We introduce <strong>Automotive-ENV</strong>, a high-fidelity benchmark and
157
- interaction environment tailored for vehicle GUIs. The platform defines <strong>185 parameterized tasks</strong> spanning
158
- explicit control, implicit intent understanding, and safety-aware tasks, and provides structured multimodal
159
- observations with precise programmatic checks for reproducible evaluation.
160
- </p>
161
- <p>
162
- Building on this benchmark, we propose <strong>ASURADA</strong>, a geo-aware multimodal agent that integrates GPS-informed
163
- context to adapt actions by location, environment, and regional norms. Experiments show geo-awareness
164
- significantly improves safety-aware task success. We will release Automotive-ENV, with tasks and tooling, to
165
- advance safe and adaptive in-vehicle agents.
166
- </p>
167
  </div>
168
- </section>
169
-
170
- <!-- tasks preview (reserved area you can expand later) -->
171
- <section aria-label="tasks">
172
- <div class="container">
173
- <h2>Tasks (preview)</h2>
174
- <div class="grid two">
175
- <div>
176
- <h3>Explicit Control</h3>
177
- <p>Deterministic UI manipulations under constraints (climate, media, navigation, connectivity).</p>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
178
  </div>
179
- <div>
180
- <h3>Implicit Intent</h3>
181
- <p>Goal inference from short user context with preference awareness and minimal steps.</p>
182
- </div>
183
- <div>
184
- <h3>Safety-Aware</h3>
185
- <p>Sensor + context classification (danger vs. do-nothing) with strict action gating and escalation logic.</p>
186
- </div>
187
- <div>
188
- <h3>Evaluation</h3>
189
- <p>Programmatic checks, success/failure traces, generalization splits, and ablations.</p>
 
 
 
 
 
 
 
 
 
190
  </div>
191
  </div>
192
  </div>
193
- </section>
 
194
 
195
- <!-- citation -->
196
- <section aria-label="citation">
197
- <div class="container">
198
- <h2>Citation</h2>
199
- <pre><code>@article{yan2025automotive_env,
200
  title = {AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems},
201
  author = {Yan, Junfeng and Wu, Biao and Fang, Meng and Chen, Ling},
202
  journal = {arXiv preprint arXiv:2509.21143},
203
  year = {2025}
204
  }</code></pre>
 
 
 
 
 
 
 
 
 
 
 
 
205
  </div>
206
- </section>
207
-
208
- <footer>
209
- © 2025 automotive-env hosted on GitHub Pages
210
- </footer>
 
 
 
 
 
211
 
212
- <!-- Lightbox target (click anywhere to close) -->
213
- <a id="fig-arch" class="lightbox" href="#">
214
- <img src="demo_arch.jpg" alt="Automotive-ENV architecture overview (full size)">
215
- </a>
216
  </body>
217
  </html>
 
1
  <!DOCTYPE html>
2
+ <html>
3
  <head>
4
+ <meta charset="utf-8">
5
+ <meta name="description"
6
+ content="AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems. A high-fidelity benchmark and environment for in-vehicle GUIs with 185 parameterized tasks and reproducible checks.">
7
+ <meta name="keywords" content="Automotive-ENV, multimodal agents, vehicle GUI, benchmark, ASURADA">
8
+ <meta name="viewport" content="width=device-width, initial-scale=1">
9
  <title>AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems</title>
 
10
 
11
+ <!-- Optional: remove if you don't use GA -->
12
+ <script async src="https://www.googletagmanager.com/gtag/js?id=G-PYVRSFMDRL"></script>
13
+ <script>
14
+ window.dataLayer = window.dataLayer || [];
15
+ function gtag(){ dataLayer.push(arguments); }
16
+ gtag('js', new Date());
17
+ gtag('config', 'G-PYVRSFMDRL');
18
+ </script>
19
+
20
+ <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro" rel="stylesheet">
21
+
22
+ <!-- All local files in the repo root -->
23
+ <link rel="stylesheet" href="bulma.min.css">
24
+ <link rel="stylesheet" href="bulma-carousel.min.css">
25
+ <link rel="stylesheet" href="bulma-slider.min.css">
26
+ <link rel="stylesheet" href="fontawesome.all.min.css">
27
+ <link rel="stylesheet" href="index.css">
28
+ <link rel="icon" href="favicon.svg">
29
+
30
+ <script defer src="fontawesome.all.min.js"></script>
31
+ <script src="bulma-carousel.min.js"></script>
32
+ <script src="bulma-slider.min.js"></script>
33
+ <script src="index.js"></script>
34
 
35
  <style>
36
+ body { background: #ffffff; color: #111; }
37
+ .hero { background: #fff; }
38
+ .publication-title { letter-spacing: -0.02em; }
39
+ .publication-links .button { margin: 0 6px 8px; }
40
+ .system-figure img { max-width: 100%; height: auto; border: 1px solid #eee; border-radius: 6px; }
41
+ .subtitle { color: #444; }
42
+ .footer { background: #fafafa; }
43
+ section, .hero, .navbar { border-bottom: 0 !important; }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  </style>
45
  </head>
 
46
  <body>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
 
48
+ <nav class="navbar" role="navigation" aria-label="main navigation">
49
+ <div class="navbar-brand">
50
+ <a role="button" class="navbar-burger" aria-label="menu" aria-expanded="false">
51
+ <span aria-hidden="true"></span>
52
+ <span aria-hidden="true"></span>
53
+ <span aria-hidden="true"></span>
54
+ </a>
55
+ </div>
56
+ <div class="navbar-menu">
57
+ <div class="navbar-start" style="flex-grow: 1; justify-content: center;">
58
+ <a class="navbar-item" href="https://github.com/automotive-env/AutmotiveEnv.github.io" target="_blank" rel="noopener">
59
+ <span class="icon"><i class="fab fa-github"></i></span>
60
+ </a>
61
+ <a class="navbar-item" href="https://arxiv.org/abs/2509.21143" target="_blank" rel="noopener">
62
+ <span class="icon"><i class="ai ai-arxiv"></i></span>
63
+ </a>
64
  </div>
65
+ </div>
66
+ </nav>
67
+
68
+ <section class="hero">
69
+ <div class="hero-body">
70
+ <div class="container is-max-desktop">
71
+ <div class="columns is-centered">
72
+ <div class="column has-text-centered">
73
+
74
+ <h1 class="title is-1 publication-title">AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems</h1>
75
+
76
+ <div class="is-size-5 publication-authors">
77
+ <span class="author-block"><strong>Junfeng Yan</strong><sup>*1</sup>,</span>
78
+ <span class="author-block"><strong>Biao Wu</strong><sup>*1</sup>,</span>
79
+ <span class="author-block"><strong>Meng Fang</strong><sup>2</sup>,</span>
80
+ <span class="author-block"><strong>Ling Chen</strong><sup>1</sup></span>
81
+ </div>
82
+
83
+ <div class="is-size-6 publication-authors" style="margin-top:6px;">
84
+ <span class="author-block"><sup>1</sup>Australian Artificial Intelligence Institute, Sydney, Australia</span><br>
85
+ <span class="author-block"><sup>2</sup>University of Liverpool, Liverpool, United Kingdom</span>
86
+ </div>
87
+
88
+ <div class="column has-text-centered" style="margin-top:16px;">
89
+ <div class="publication-links">
90
+ <span class="link-block">
91
+ <a href="https://arxiv.org/abs/2509.21143"
92
+ class="external-link button is-normal is-rounded is-dark" target="_blank" rel="noopener">
93
+ <span class="icon"><i class="ai ai-arxiv"></i></span>
94
+ <span>Paper</span>
95
+ </a>
96
+ </span>
97
+ <span class="link-block">
98
+ <a href="https://github.com/automotive-env/AutmotiveEnv.github.io"
99
+ class="external-link button is-normal is-rounded is-dark" target="_blank" rel="noopener">
100
+ <span class="icon"><i class="fab fa-github"></i></span>
101
+ <span>Code (site)</span>
102
+ </a>
103
+ </span>
104
+ <span class="link-block">
105
+ <a href="demo.mp4"
106
+ class="external-link button is-normal is-rounded is-dark" target="_blank" rel="noopener">
107
+ <span class="icon"><i class="fas fa-play"></i></span>
108
+ <span>Demo Video</span>
109
+ </a>
110
+ </span>
111
+ </div>
112
+ </div>
113
+
114
+ </div>
115
  </div>
116
  </div>
117
+ </div>
118
+ </section>
119
+
120
+ <section class="section">
121
+ <div class="container is-max-desktop">
122
+ <div class="columns is-centered">
123
+ <div class="column is-four-fifths">
124
+ <h2 class="title is-3 has-text-centered">System Overview</h2>
125
+ <div class="system-figure has-text-centered">
126
+ <!-- image at repo root -->
127
+ <img src="demo_arch.jpg" alt="Automotive-ENV system architecture overview">
128
+ <p class="subtitle is-6" style="margin-top:8px;">Figure 1. Automotive-ENV architecture overview.</p>
129
+ </div>
130
  </div>
131
  </div>
132
+ </div>
133
+ </section>
134
+
135
+ <section class="hero teaser">
136
+ <div class="container is-max-desktop">
137
+ <div class="hero-body">
138
+ <video id="teaser" autoplay muted loop playsinline height="100%">
139
+ <!-- video at repo root -->
140
+ <source src="demo.mp4" type="video/mp4">
141
+ </video>
142
+ <h2 class="subtitle has-text-centered" style="margin-top:10px;">
143
+ A short looping demo showcasing Automotive-ENV tasks and agent behavior.
144
+ </h2>
 
 
 
 
 
 
145
  </div>
146
+ </div>
147
+ </section>
148
+
149
+ <section class="section">
150
+ <div class="container is-max-desktop">
151
+ <div class="columns is-centered has-text-centered">
152
+ <div class="column is-four-fifths">
153
+ <h2 class="title is-3">Abstract</h2>
154
+ <div class="content has-text-justified">
155
+ <p>
156
+ Multimodal agents have demonstrated strong performance in general GUI interactions, but their
157
+ application in automotive systems has been largely unexplored. In-vehicle GUIs present distinct
158
+ challenges: drivers’ limited attention, strict safety requirements, and complex location-based
159
+ interaction patterns. To address these challenges, we introduce <strong>Automotive-ENV</strong>,
160
+ the first high-fidelity benchmark and interaction environment tailored for vehicle GUIs.
161
+ </p>
162
+ <p>
163
+ This platform defines <strong>185 parameterized tasks</strong> spanning explicit control,
164
+ implicit intent understanding, and safety-aware tasks, and provides structured multimodal
165
+ observations with precise programmatic checks for reproducible evaluation. Building on this
166
+ benchmark, we propose <strong>ASURADA</strong>, a geo-aware multimodal agent that integrates
167
+ GPS-informed context to dynamically adjust actions based on location, environmental conditions,
168
+ and regional driving norms.
169
+ </p>
170
+ <p>
171
+ Experiments show that geo-aware information significantly improves success on safety-aware tasks,
172
+ highlighting the importance of location-based context in automotive environments. We will release
173
+ Automotive-ENV, complete with all tasks and benchmarking tools, to further the development of
174
+ safe and adaptive in-vehicle agents.
175
+ </p>
176
  </div>
177
+ </div>
178
+ </div>
179
+ </div>
180
+ </section>
181
+
182
+ <section class="section">
183
+ <div class="container is-max-desktop">
184
+ <div class="columns is-centered">
185
+ <div class="column is-full-width">
186
+ <h2 class="title is-3">Tasks (Preview)</h2>
187
+ <div class="content has-text-justified">
188
+ <p>
189
+ Automotive-ENV groups tasks into three categories with programmatic success criteria:
190
+ </p>
191
+ <ul>
192
+ <li><strong>Explicit Control</strong>: climate, media, navigation, connectivity.</li>
193
+ <li><strong>Implicit Intent</strong>: infer user goals from short context; minimize UI steps.</li>
194
+ <li><strong>Safety-Aware</strong>: sensor + context classification with strict action gating.</li>
195
+ </ul>
196
+ <p>Per-task thumbnails and clips will be added in future updates.</p>
197
  </div>
198
  </div>
199
  </div>
200
+ </div>
201
+ </section>
202
 
203
+ <section class="section" id="BibTeX">
204
+ <div class="container is-max-desktop content">
205
+ <h2 class="title">BibTeX</h2>
206
+ <pre><code>@article{yan2025automotive_env,
 
207
  title = {AUTOMOTIVE-ENV: Benchmarking Multimodal Agents in Vehicle Interface Systems},
208
  author = {Yan, Junfeng and Wu, Biao and Fang, Meng and Chen, Ling},
209
  journal = {arXiv preprint arXiv:2509.21143},
210
  year = {2025}
211
  }</code></pre>
212
+ </div>
213
+ </section>
214
+
215
+ <footer class="footer">
216
+ <div class="container">
217
+ <div class="content has-text-centered">
218
+ <a class="icon-link" href="https://arxiv.org/abs/2509.21143" target="_blank" rel="noopener">
219
+ <i class="ai ai-arxiv"></i>
220
+ </a>
221
+ <a class="icon-link" href="https://github.com/automotive-env/AutmotiveEnv.github.io" target="_blank" rel="noopener">
222
+ <i class="fab fa-github"></i>
223
+ </a>
224
  </div>
225
+ <div class="columns is-centered">
226
+ <div class="column is-8">
227
+ <div class="content has-text-centered">
228
+ <p>This website reuses the open-source Nerfies/OS-World page framework. Remove analytics if not used.</p>
229
+ <p>© 2025 automotive-env — Hosted on GitHub Pages.</p>
230
+ </div>
231
+ </div>
232
+ </div>
233
+ </div>
234
+ </footer>
235
 
 
 
 
 
236
  </body>
237
  </html>