-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathindex.html
365 lines (318 loc) · 16.1 KB
/
index.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
<!doctype html>
<html lang="en">
<head>
<script type="text/javascript">
// Analytics loader: records the name 'ga' in window.GoogleAnalyticsObject,
// defines window.ga (unless it already exists) as a stub that appends each
// call's arguments to ga.q, stamps ga.l with the current time, and inserts an
// async <script> pointing at analytics.js before the first <script> element.
(function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
(i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
})(window,document,'script','//www.google-analytics.com/analytics.js','ga');
// Two trackers are created: one without a name and one named 'jesseTracker'.
ga('create', 'UA-8024377-10', 'auto');
ga('create', 'UA-25750945-3', 'auto', 'jesseTracker');
// A pageview is sent through each tracker.
ga('send', 'pageview');
ga('jesseTracker.send', 'pageview');
</script>
<script src="https://ajax.googleapis.com/ajax/libs/jquery/3.4.1/jquery.min.js"></script>
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<meta name="author" content="Mark Otto, Jacob Thornton, and Bootstrap contributors">
<meta name="generator" content="Jekyll v3.8.5">
<title>ALFRED -- A Benchmark for Interpreting Grounded Instructions for Everyday Tasks</title>
<link rel="canonical" href="http://askforalfred.com">
<!-- Bootstrap core CSS -->
<link rel="stylesheet" href="https://stackpath.bootstrapcdn.com/bootstrap/4.2.1/css/bootstrap.min.css" integrity="sha384-GJzZqFGwb1QTTN6wy59ffF1BuGJpLSa9DkKMp0DgiMDm4iYMj70gZWKYbI706tWS" crossorigin="anonymous">
<link rel="stylesheet" href="index.css">
<meta http-equiv="x-ua-compatible" content="ie=edge">
<meta name="viewport" content="width=device-width, minimum-scale=1.0">
<meta name="twitter:title" content="ALFRED">
<meta property="og:title" content="ALFRED">
<meta name="description" content="A Benchmark for Interpreting Grounded Instructions for Everyday Tasks">
<meta name="twitter:description" content="A Benchmark for Interpreting Grounded Instructions for Everyday Tasks">
<meta property="og:description" content="A Benchmark for Interpreting Grounded Instructions for Everyday Tasks">
<meta property="og:image" content="https://askforalfred.com/images/alfred_bg.jpg">
<meta name="twitter:image" content="https://askforalfred.com/images/alfred_bg.jpg">
<meta name="twitter:card" content="summary_large_image">
<meta property="twitter:image:width" content="1200">
<meta property="twitter:image:height" content="630">
<meta property="og:image:width" content="1200">
<meta property="og:image:height" content="630">
<script>
/**
 * Reports a click to Google Analytics as an 'outbound' / 'click' event.
 *
 * The same event is sent twice: once through the unnamed tracker ('send') and
 * once through the tracker named 'jesseTracker'. Each hit sets the transport
 * field to 'beacon', which lets the hit be sent with navigator.sendBeacon in
 * browsers that support it.
 *
 * @param {string} url Value used as the event label. Callers in this page pass
 *     either a destination URL or a short action name such as 'random'.
 * @returns {boolean} Always false.
 */
var captureOutboundLink = function(url) {
  var sendCommands = ['send', 'jesseTracker.send'];
  for (var k = 0; k < sendCommands.length; k++) {
    // A new options object is built for every hit.
    var fieldsObject = { 'transport': 'beacon' };
    ga(sendCommands[k], 'event', 'outbound', 'click', url, fieldsObject);
  }
  return false;
};
</script>
<style>
/* Rules for elements with class bd-placeholder-img: font size, middle text
   anchoring, and text selection disabled (vendor-prefixed declarations come
   before the standard user-select property). */
.bd-placeholder-img {
font-size: 1.125rem;
text-anchor: middle;
-webkit-user-select: none;
-moz-user-select: none;
-ms-user-select: none;
user-select: none;
}
/* From a viewport width of 768px upward, elements with class
   bd-placeholder-img-lg get a larger font size. */
@media (min-width: 768px) {
.bd-placeholder-img-lg {
font-size: 3.5rem;
}
}
</style>
<script>
/**
 * Looks up one parameter in the current page's query string
 * (location.search).
 *
 * The name is compared against the raw, undecoded key. When the key occurs
 * more than once, the last occurrence wins. Only the first "=" of a pair
 * separates key from value, so a value may itself contain "=".
 *
 * @param {string} parameterName Exact parameter name to look for.
 * @returns {?string} The percent-decoded value; "" when the parameter is
 *     present without a value; the raw value when it is not valid
 *     percent-encoding; null when the parameter is absent.
 */
function findGetParameter(parameterName) {
  var result = null;
  // location.search is either "" or starts with "?".
  var query = location.search.replace(/^\?/, "");
  if (query === "") {
    return result;
  }
  var pairs = query.split("&");
  for (var index = 0; index < pairs.length; index++) {
    var pair = pairs[index];
    var eq = pair.indexOf("=");
    var key = eq === -1 ? pair : pair.slice(0, eq);
    if (key !== parameterName) {
      continue;
    }
    // A bare key ("?flag") has no value; report "" rather than "undefined".
    var rawValue = eq === -1 ? "" : pair.slice(eq + 1);
    try {
      result = decodeURIComponent(rawValue);
    } catch (e) {
      // decodeURIComponent throws URIError on a malformed escape sequence;
      // fall back to the raw text so a bad link cannot abort page start-up.
      result = rawValue;
    }
  }
  return result;
}
// Run the data viewer.
// Shared state of the data viewer. The initial values below are placeholders;
// load_data() overwrites them inside its splits.json callback.
// Parsed contents of splits.json.
var splits_data = 0;
// Lengths of the train / valid_seen / valid_unseen arrays of splits_data.
var training_size = 0;
var val_s_size = 0;
var val_u_size = 0;
// Id of the selected example, computed as
// (training_size * split index) + index within that split.
var vid = null;
// Split keys, in the order that defines the split index used by vid.
var splits_names;
// Entry counts, in the same order as splits_names.
var splits_sizes;
/**
 * Page start-up for the data viewer (wired to the body's onload attribute).
 *
 * Fetches splits.json, fills the shared viewer state (splits_data, the three
 * size counters, splits_names, splits_sizes), then selects and displays one
 * example: the one named by the "vid" query parameter when that value decodes
 * to an existing example, otherwise a random one from choose_example().
 *
 * The query-string value is text, so it is accepted only if it consists of
 * digits and is stored in `vid` as a number. A value that is not numeric or
 * points past the end of a split would make view_example() index a missing
 * entry and throw, so such values fall back to a random example.
 */
function load_data() {
  $.getJSON('splits.json', function(jd) {
    splits_data = jd;
    training_size = jd.train.length;
    val_s_size = jd.valid_seen.length;
    val_u_size = jd.valid_unseen.length;
    splits_names = ["train", "valid_seen", "valid_unseen"];
    splits_sizes = [training_size, val_s_size, val_u_size];

    var requested = findGetParameter("vid");
    var candidate = (typeof requested === "string" && /^\d+$/.test(requested))
        ? parseInt(requested, 10)
        : NaN;
    // Same decoding as view_example(): split index, then index in the split.
    var split_index = Math.floor(candidate / training_size);
    var entry_index = candidate % training_size;
    // Comparisons against NaN / Infinity are false, which selects the fallback.
    if (split_index < splits_sizes.length && entry_index < splits_sizes[split_index]) {
      vid = candidate;
    } else {
      choose_example();
    }
    view_example();
  });
}
// Handler for the "Show Random Example" button: logs a 'random' analytics
// event, picks a new example id, then displays it.
function new_random_example() {
captureOutboundLink('random');
// choose_example() stores the new id in the global vid, which
// view_example() reads, so the order of these two calls matters.
choose_example();
view_example();
}
/**
 * Handler for the "Retrieve Example" button.
 *
 * Reads "<task>.<repeat_idx>" from #input_retrieve_example, searches the
 * splits in splits_names order for an entry whose "task" equals <task> and
 * whose "repeat_idx" equals <repeat_idx>, and on the first match stores
 * (training_size * split index) + entry index in the global `vid` and calls
 * view_example(). When nothing matches - including unparsable input, or a
 * click before the split data has loaded - #warning_retrieve_example is shown
 * and `vid` is left unchanged.
 *
 * Also logs a 'retrieve' analytics event on every call.
 */
function retrieve_example() {
  captureOutboundLink('retrieve');
  var raw_str = String($('#input_retrieve_example').val() || "").trim();
  // Split on the last "." so only the trailing number is the repeat index.
  var dot = raw_str.lastIndexOf(".");
  var task = (dot === -1 ? raw_str : raw_str.slice(0, dot)).trim();
  var repeat = (dot === -1 ? "" : raw_str.slice(dot + 1)).trim();
  var found = -1;
  // splits_names stays undefined until load_data() has received splits.json.
  // Requiring digits keeps an empty repeat index from matching repeat_idx 0.
  if (splits_names && /^\d+$/.test(repeat)) {
    var wanted = parseInt(repeat, 10);
    for (var s = 0; s < splits_names.length && found === -1; s++) {
      var entries = splits_data[splits_names[s]];
      var count = splits_sizes[s];
      for (var i = 0; i < count; i++) {
        // Loose equality on purpose: repeat_idx is compared by numeric value.
        if (entries[i]["repeat_idx"] == wanted && entries[i]["task"] === task) {
          found = (training_size * s) + i;
          break;
        }
      }
    }
  }
  if (found > -1) {
    vid = found;
    view_example();
  }
  else {
    $('#warning_retrieve_example').show();
  }
}
/**
 * Picks a random example and stores its id in the global `vid`.
 *
 * A split is drawn uniformly from the entries of splits_sizes, then an index
 * is drawn uniformly within that split; the id is
 * (training_size * split index) + index. Expects the split data to have been
 * loaded already (splits_sizes and training_size set by load_data()).
 */
function choose_example() {
  // Choose a random example.
  var split_index = Math.floor(Math.random() * splits_sizes.length);
  var entry_index = Math.floor(Math.random() * splits_sizes[split_index]);
  vid = (training_size * split_index) + entry_index;
}
/**
 * Displays the example identified by the global `vid`.
 *
 * `vid` is decoded as split index = floor(vid / training_size) and entry
 * index = vid % training_size. For that entry the function:
 *   - points #expert_video at the entry's video.mp4 and starts it at 2x speed,
 *   - fetches the entry's traj_data.json and fills #highlevel / #lowlevel from
 *     turk_annotations.anns[repeat_idx],
 *   - writes "<task>.<repeat_idx>" into #input_retrieve_example,
 *   - writes a permanent link ("<page URL>?vid=<vid>") into #plink.
 *
 * If `vid` does not decode to an existing entry, #warning_retrieve_example is
 * shown and nothing else is changed.
 */
function view_example() {
  // Annotation text comes from a fetched JSON file, so it is escaped before
  // being placed into markup.
  function escape_html(text) {
    return String(text)
      .replace(/&/g, "&amp;")
      .replace(/</g, "&lt;")
      .replace(/>/g, "&gt;")
      .replace(/"/g, "&quot;")
      .replace(/'/g, "&#39;");
  }

  $('#warning_retrieve_example').hide();
  var s = Math.floor(vid / training_size);
  var i = vid % training_size;
  var S = splits_names[s];
  var entry = (S !== undefined && splits_data[S]) ? splits_data[S][i] : undefined;
  if (entry === undefined) {
    // vid names no known example (for instance a hand-edited ?vid= link).
    $('#warning_retrieve_example').show();
    return;
  }
  // Remembered so that a slow response for an earlier example is ignored.
  var shown_vid = vid;

  // Show video.
  var video = document.getElementById('expert_video');
  video.src = "https://ai2-vision-alfred-data-explorer.s3-us-west-2.amazonaws.com/" + entry["task"] + "/video.mp4";
  video.playbackRate = 2;
  video.defaultPlaybackRate = 2;
  var play_attempt = video.play();
  if (play_attempt && typeof play_attempt.catch === "function") {
    // play() may return a promise that rejects (e.g. autoplay blocked);
    // the player's controls stay usable, so the rejection is ignored.
    play_attempt.catch(function() {});
  }

  // Retrieve text from JSON.
  var aidx = entry["repeat_idx"];
  var traj_json_url = "https://raw.githubusercontent.com/askforalfred/alfred/master/data/json_2.1.0/" + S + "/" + entry["task"] + "/traj_data.json";
  $.getJSON(traj_json_url, function(jd) {
    if (vid !== shown_vid) {
      return;
    }
    // Populate high and low level text.
    var annotation = jd.turk_annotations.anns[aidx];
    $('#highlevel').text(annotation.task_desc);
    $('#lowlevel').html(annotation.high_descs.map(escape_html).join("<br/>"));
  });

  // Populate retrieval field with video ID.
  $('#input_retrieve_example').val(entry["task"] + "." + aidx);

  // Get plink: drop any existing query string and fragment first, otherwise
  // a URL ending in "#" would yield "...#?vid=N", which is not a query.
  var url_base = window.location.href.split(/[?#]/)[0];
  $('#plink').text(url_base + "?vid=" + vid);
}
</script>
<!-- Custom styles for this template -->
<link href="https://getbootstrap.com/docs/4.3/examples/jumbotron/jumbotron.css" rel="stylesheet">
<script src="https://maxcdn.bootstrapcdn.com/bootstrap/4.0.0/js/bootstrap.min.js" integrity="sha384-JZR6Spejh4U02d8jOt6vLEHfe/JQGiRRSQQxSfFWpi1MquVdAyjUar5+76PVCmYl" crossorigin="anonymous"></script>
</head>
<body onload="load_data()" style="padding-top: 0px;">
<nav class="navbar navbar-expand-lg navbar-dark bg-dark">
<a class="navbar-brand" href="#">ALFRED <img src="images/alfred-white.svg" width=50></a>
<button class="navbar-toggler" type="button" data-toggle="collapse" data-target="#navbars" aria-controls="navbars" aria-expanded="false" aria-label="Toggle navigation">
<span class="navbar-toggler-icon"></span>
</button>
<div class="collapse navbar-collapse" id="navbars">
<div class="navbar-nav">
<a class="nav-item nav-link active" href="#">Home <span class="sr-only">(current)</span></a>
<a class="nav-item nav-link" href="https://arxiv.org/abs/1912.01734"
target="_blank" onclick="captureOutboundLink('https://arxiv.org/abs/1912.01734');">Paper</a>
<div class="nav-item dropdown">
<a class="nav-link dropdown-toggle" data-toggle="dropdown" href="#">Data &amp; Code</a>
<div class="dropdown-menu">
<a class="dropdown-item" href="https://github.com/askforalfred/alfred/tree/master/data" target="_blank">Data</a>
<a class="dropdown-item" href="https://github.com/askforalfred/alfred" target="_blank">Code</a>
<a class="dropdown-item" href="https://allenai.github.io/ai2thor-v2.1.0-documentation/installation" target="_blank">THOR 2.1.0 Docs</a>
</div>
</div>
<div class="nav-item dropdown">
<a class="nav-link dropdown-toggle" data-toggle="dropdown" href="#">Compete</a>
<div class="dropdown-menu">
<a class="dropdown-item" href="https://leaderboard.allenai.org/alfred/submissions/public" target="_blank">Leaderboard</a>
<a class="dropdown-item" href="EAI23">CVPR 2023 Challenge</a>
<a class="dropdown-item" href="EAI22">CVPR 2022 Challenge</a>
<a class="dropdown-item" href="EAI21">CVPR 2021 Challenge</a>
<a class="dropdown-item" href="EVAL">ECCV 2020 Challenge</a>
</div>
</div>
<a class="nav-item nav-link" href="https://alfworld.github.io/" onclick="captureOutboundLink('https://alfworld.github.io/');">ALFWorld</a>
<a class="nav-item nav-link" href="https://teachingalfred.github.io/" onclick="captureOutboundLink('https://teachingalfred.github.io/');">TEACh</a>
</div>
</div>
</nav>
<main role="main">
<!-- Main jumbotron -->
<div class="jumbotron">
<div class="container">
<h1 class="display-3">ALFRED <img style="vertical-align:middle" src="images/alfred.svg" width=110></h1>
<h3>A Benchmark for Interpreting Grounded Instructions for Everyday Tasks</h3>
<h6>
<table>
<tr>
<td width=200><a href="https://mohitshridhar.com/" target="_blank" onclick="captureOutboundLink('https://mohitshridhar.com/');">Mohit Shridhar</a></td>
<td width=200><a href="https://jessethomason.com/" target="_blank" onclick="captureOutboundLink('https://jessethomason.com/');">Jesse Thomason</a></td>
<td width=200><a href="https://homes.cs.washington.edu/~xkcd/" target="_blank" onclick="captureOutboundLink('https://homes.cs.washington.edu/~xkcd/');">Daniel Gordon</a></td>
<td width=200><a href="https://yonatanbisk.com/" target="_blank" onclick="captureOutboundLink('https://yonatanbisk.com/');">Yonatan Bisk</a></td>
</tr>
<tr>
<td><a href="https://allenai.org/team.html" target="_blank" onclick="captureOutboundLink('https://allenai.org/team.html');">Winson Han</a></td>
<td><a href="http://roozbehm.info/" target="_blank" onclick="captureOutboundLink('http://roozbehm.info/');">Roozbeh Mottaghi</a></td>
<td><a href="https://www.cs.washington.edu/people/faculty/lsz" target="_blank" onclick="captureOutboundLink('https://www.cs.washington.edu/people/faculty/lsz');">Luke Zettlemoyer</a></td>
<td><a href="https://homes.cs.washington.edu/~fox/" target="_blank" onclick="captureOutboundLink('https://homes.cs.washington.edu/~fox/');">Dieter Fox</a><br>
</tr></table>
</h6>
<p> <b>ALFRED</b> (<b>A</b>ction <b>L</b>earning <b>F</b>rom <b>R</b>ealistic <b>E</b>nvironments and <b>D</b>irectives), is a new benchmark for learning a mapping from natural language instructions and egocentric vision to sequences of actions for household tasks. Long composition rollouts with non-reversible state changes are among the phenomena we include to shrink the gap between research benchmarks and real-world applications.</p>
<p>
<a class="btn btn-primary btn-lg homeButton" href="https://arxiv.org/abs/1912.01734"
role="button" target="_blank" onclick="captureOutboundLink('https://arxiv.org/abs/1912.01734');">Paper on ArXiv»</a>
<a class="btn btn-primary btn-lg homeButton" href="https://github.com/askforalfred/alfred"
role="button" target="_blank" onclick="captureOutboundLink('https://github.com/askforalfred/alfred');">GitHub»</a>
<a class="btn btn-primary btn-lg homeButton" href="https://ai2thor.allenai.org/demo"
role="button" target="_blank" onclick="captureOutboundLink('https://ai2thor.allenai.org/demo');">Simulator»</a>
<a class="btn btn-danger btn-lg homeButton" href="https://leaderboard.allenai.org/alfred/submissions/public"
role="button" onclick="captureOutboundLink('Leaderboard');">Leaderboard»</a></p>
<div class="container-fluid">
<div class="row">
<div class="col-sm-6 d-flex justify-content-right">
<iframe width="560" height="315" id="ytVid" src="https://www.youtube.com/embed/1XoRLNmXffo" frameborder="0" allow="accelerometer; autoplay; encrypted-media; gyroscope; picture-in-picture" allowfullscreen></iframe>
</div>
<div class="col-sm-6 d-flex justify-content-left">
<div class="card bg-light">
<div class="card-body">
<p class="card-text">
<code id="bib"><font color="black">
@inproceedings{ALFRED20,<br>
title ={{ALFRED: A Benchmark for Interpreting Grounded <br>
Instructions for Everyday Tasks}},<br>
author={Mohit Shridhar and Jesse Thomason and<br>
Daniel Gordon and Yonatan Bisk and<br>
Winson Han and Roozbeh Mottaghi and<br>
Luke Zettlemoyer and Dieter Fox},<br>
booktitle = {The IEEE Conference on Computer Vision <br>
and Pattern Recognition (CVPR)},<br>
year = {2020},<br>
url = {https://arxiv.org/abs/1912.01734}<br>
}
</font></code>
</p>
</div>
</div>
</div>
</div>
</div>
</div>
</div>
</main>
<div class="container">
<center>
<h2>Data Explorer</h2>
<table>
<tr><td>
<div>
<button class="btn btn-info btn-md" onclick="new_random_example()">Show Random Example</button>
<br/><br/>
<button class="btn btn-info btn-md" onclick="retrieve_example()">Retrieve Example</button>
<input width="100%" id="input_retrieve_example">
<div class="alert alert-danger" role="alert" id="warning_retrieve_example">Could not parse the specified example name.</div>
<table class="table table-striped">
<tr><td colspan=2>
<center><video width="320" height="240" controls id="expert_video" type="video/mp4">
Your browser does not support the video tag.
</video></center>
</td></tr>
<tr><td><b>Goal Instruction</b></td><td id="highlevel"></td></tr>
<tr><td><b>Step-by-Step Instructions</b></td><td id="lowlevel"></td></tr>
<tr><td><b>Permanent Link</b></td><td id="plink"></td></tr>
</table>
</div>
</td></tr>
</table>
</center>
<hr>
</div> <!-- /container -->
<footer class="container">
<div id="groupContainer">
<img src="images/UW.jpg" class="groupLogo">
<img src="images/cmu.jpg" class="groupLogo">
<img src="images/AI2.png" class="groupLogo">
<img src="images/nvidia.jpg" class="groupLogo">
</div>
<br>
<p>Questions or issues? Contact <a href="mailto:[email protected]">[email protected]</a></p>
</footer>
</body>
</html>