-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathindex.html
397 lines (331 loc) · 18.2 KB
/
index.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
<!DOCTYPE html>
<html lang="en">
<head>
<!-- Document head: page title, encoding/viewport metadata, then every third-party stylesheet and script the page relies on. -->
<title>MIntRec</title>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<!-- CSS IMPORTS -->
<!-- One line, three stylesheets: the site stylesheet, Font Awesome 4.7.0 and the hk-grotesk face from fontlibrary.org. -->
<link rel="stylesheet" href="static/styles/index.css"> <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css"> <link rel="stylesheet" media="screen" href="https://fontlibrary.org/face/hk-grotesk" type="text/css"/>
<!-- <link rel="icon" href="static/images/favicon.png"> title-bar logo (favicon) -->
<!-- NOTE(review): Font Awesome 5.1.1 is loaded here in addition to 4.7.0 above; confirm both releases are needed. -->
<link rel="stylesheet" href="https://use.fontawesome.com/releases/v5.1.1/css/all.css" integrity="sha384-O8whS3fhG2OnA5Kas0Y9l3cfpmYjapjI0E4theH4iuMD+pLhbf6JI0jIMfYcK3yZ" crossorigin="anonymous">
<link href="https://afeld.github.io/emoji-css/emoji.css" rel="stylesheet">
<!-- Bootstrap 3.3.7 core and theme stylesheets (with subresource-integrity hashes). -->
<link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
<link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap-theme.min.css" integrity="sha384-rHyoN1iRsVXV4nD0JutlnGaslCJuC7uwjduW9SVrLvRYooPp2bWYgmgJQIXwl/Sp" crossorigin="anonymous">
<!-- JS IMPORTS -->
<!-- First jQuery copy (2.2.4), followed by mustache.js 2.3.0 and the Bootstrap 3.3.7 script. -->
<script src="https://code.jquery.com/jquery-2.2.4.min.js" integrity="sha256-BbhdlvQf/xTY9gja0Dq3HiwQF8LaCRTXxZKRutelT44=" crossorigin="anonymous"></script>
<script src="https://cdnjs.cloudflare.com/ajax/libs/mustache.js/2.3.0/mustache.min.js" integrity="sha256-iaqfO5ue0VbSGcEiQn+OeXxnxAMK2+QgHXIDA5bWtGI=" crossorigin="anonymous"></script>
<script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
<!-- A stylesheet placed among the scripts. NOTE(review): the package specifier in this URL reads "[email protected]", which looks like an e-mail-obfuscation artifact rather than a name@version pair; confirm the intended package and version. -->
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/[email protected]/font/bootstrap-icons.css">
<script src="https://cdnjs.cloudflare.com/ajax/libs/moment.js/2.17.1/moment.min.js" integrity="sha256-Gn7MUQono8LUxTfRA0WZzJgTua52Udm1Ifrk5421zkA=" crossorigin="anonymous"></script>
<!-- Second jQuery copy (2.1.4), loaded without an integrity hash. NOTE(review): a later jQuery load presumably replaces the global $ / jQuery set by the 2.2.4 copy above; confirm which copy is meant to win. -->
<script src="https://apps.bdimg.com/libs/jquery/2.1.4/jquery.min.js"></script>
<!-- New Bootstrap core CSS file (second include of Bootstrap 3.3.7 CSS, from a different CDN). -->
<link href="https://cdn.staticfile.org/twitter-bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet">
<!-- jQuery file. Must be included before bootstrap.min.js. This is the third jQuery copy (2.1.1). -->
<script src="https://cdn.staticfile.org/jquery/2.1.1/jquery.min.js"></script>
<!-- Latest Bootstrap core JavaScript file (second include of the Bootstrap 3.3.7 script). -->
<script src="https://cdn.staticfile.org/twitter-bootstrap/3.3.7/js/bootstrap.min.js"></script>
<!-- Include layui.css. NOTE(review): this URL and the three layui URLs below carry the same mangled "[email protected]" specifier; confirm the intended layui version. -->
<link rel="stylesheet" href="//unpkg.com/[email protected]/dist/css/layui.css">
<!-- Include layui.js -->
<script src="//unpkg.com/[email protected]/dist/layui.js"> </script>
<!-- Include layui.css (second include; as written the URL is the same as the one above). -->
<link href="//unpkg.com/[email protected]/dist/css/layui.css" rel="stylesheet">
<!-- Include layui.js (second include; as written the URL is the same as the one above). -->
<script src="//unpkg.com/[email protected]/dist/layui.js"></script>
<!-- busuanzi counter script, loaded asynchronously; the hidden busuanzi_value_* spans after </head> are presumably its output targets. -->
<script async src="//busuanzi.ibruce.info/busuanzi/2.3/busuanzi.pure.mini.js">
</script>
</head>
<!-- Hidden visit counters: three spans with busuanzi_value_* ids, presumably filled in by the busuanzi script loaded in <head>. The Chinese labels read roughly "total site views", "site visitors" and "total reads of this page". NOTE(review): this element sits between </head> and <body>; confirm that placement is intended. -->
<div hidden="hidden">
本站总访问量<span id="busuanzi_value_site_pv"></span>次
本站访客数<span id="busuanzi_value_site_uv"></span>人次
本文总阅读量<span id="busuanzi_value_page_pv"></span>次
</div>
<style>
  /* White background for the .layui-this marker pseudo-element and for .layui-nav-bar. */
  .layui-nav .layui-this:after,
  .layui-nav-bar {
    background-color: white;
  }

  /* Blue background for the navigation bar itself. */
  .layui-nav {
    background-color: #4371C6;
  }

  /* Left padding for paragraphs carrying the "rank" class. */
  p.rank {
    padding-left: 30px;
  }

  /* Page defaults: font family and a white page background. */
  body {
    font-family: 'HankenGroteskRegular';
    background-color: white;
  }
</style>
<body>
<script>
// Navigate the current window to the raw-data page (used by the "Raw Data" button's onclick).
function raw_data() {
  var destination = "raw_data.html";
  window.location.href = destination;
}
// Navigate the current window to the features page (used by the "Features" button's onclick).
function Features() {
  var destination = "Features_1.html";
  window.location.href = destination;
}
// Navigate the current window to the local "Fork_On_Github.html" page (used by the "Github" button's onclick).
function Fork_On_Github() {
  var destination = "Fork_On_Github.html";
  window.location.href = destination;
}
</script>
<!-- Top navigation bar: a layui nav list linking to index.html (Home) and leaderboard.html (Leaderboard). The Home item carries the layui-this class, presumably marking it as the current page. -->
<ul class="layui-nav" lay-filter="">
<li lay-unselect class="layui-nav-item layui-this"><a href="index.html">Home</a></li>
<li lay-unselect class="layui-nav-item"><a href="leaderboard.html">Leaderboard</a></li>
</ul>
<script>
// Note: the navigation depends on the "element" module; without it the nav cannot perform its interactive behaviour.
layui.use('element', function(){
// The module object is read here but not used any further inside this callback.
var element = layui.element;
//…
});
</script>
<div class="container">
<div class="row">
<!-- Left sidebar: a fixed-position column holding the project title, tagline, two external links and a row of three navigation buttons. -->
<div class="col-md-3 box " style="position:fixed">
<h3 style="font-weight: 600; line-height: 1.3">MIntRec: Multimodal Intent Recognition </h3>
<br>
<p style='margin: 0 0 10px; color:#595959; font-weight: 400;font:18px/1.5 -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Oxygen, Ubuntu, Cantarell, "Fira Sans", "Droid Sans", "Helvetica Neue", Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol";'>
A New Dataset for Multimodal Intent Recognition</p>
<hr>
<br>
<!-- External links. NOTE(review): "rpx" is not a standard CSS length unit, so browsers presumably ignore the margin-top / height declarations on the two wrappers below; confirm the intended unit. -->
<div style="margin-top: 20rpx; position: relative;height: 20rpx ;">
<a style="color: #39c; " href="https://github.com/thuiar/MIntRec">View the Project on GitHub</a>
</div>
<br>
<div style="margin-top: 20rpx;">
<a style="color: #39c;" href="https://dl.acm.org/doi/10.1145/3503161.3547906">Download the paper</a>
</div>
<br>
<br>
<!-- Button row: each button's onclick calls one of the navigation functions (raw_data, Features, Fork_On_Github) defined in the first inline script of <body>. -->
<center>
<style>
/* Round only the left corners of the first button and the right corners of the last button. */
#my_button_left.btn-default{
border-top-left-radius:5px !important;
border-bottom-left-radius: 5px !important;
}
#my_button_right.btn-default{
border-top-right-radius:5px !important;
border-bottom-right-radius: 5px !important;
}
</style>
<div class="" role="group" >
<button id='my_button_left' onclick="raw_data()" type="button" class="btn btn-default col-md-4 ">
<!-- style="background-color: #999"; -->
<!-- href="https://drive.google.com/drive/folders/18iLqmUYDDOwIiiRbgwLpzw76BD62PK0p" -->
<p style=' color:#595959; font-weight: 400;font:15px -apple-system'>
Download
</p>
<strong >Raw Data</strong>
</button>
<button onclick="Features()" type="button" class="btn btn-default col-md-4" >
<!-- <a href="https://drive.google.com/drive/folders/18iLqmUYDDOwIiiRbgwLpzw76BD62PK0p"> -->
<p style=' color:#595959; font-weight: 400;font:15px -apple-system'>
Download
</p>
<strong> Features </strong>
</button>
<button id='my_button_right' onclick="Fork_On_Github()" type="button" class="btn btn-default col-md-4">
<!-- <a href="https://github.com/thuiar/MIntRec"> -->
<p style=' color:#595959; font-weight: 400;font:15px -apple-system'>
Fork On
</p>
<strong>Github </strong>
</button>
</div>
</center>
</div>
<div class="col-md-7 box layui-col-md-offset5" >
<!-- Render target: the inline script at the end of the file writes the rendered "template" markup into this element. -->
<div id="container" style="width: 100%"></div>
<script id="template" type="x-tmpl-mustache">
<p style='text-align:justify;margin: 0 0 10px; color:#595959; font-weight: 400;font:18px/1.5 -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Oxygen, Ubuntu, Cantarell, "Fira Sans", "Droid Sans", "Helvetica Neue", Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol";'>
Multimodal intent recognition is a significant task for understanding human language in real-world multimodal scenes. Most existing
intent recognition methods have limitations in leveraging the multimodal information due to the restrictions of the benchmark datasets
with only text information.
MIntRec addresses this issue. It formulates coarse-grained and fine-grained intent taxonomies
based on the data collected from the TV series Superstore. The
dataset consists of 2,224 high-quality samples with text, video, and
audio modalities and has multimodal annotations among twenty intent categories. Furthermore, we provide annotated bounding boxes
of speakers in each video segment and achieve an automatic process
for speaker annotation. MIntRec is helpful for researchers to mine
relationships between different modalities to enhance the capability of intent recognition. We extract features from each modality
and model cross-modal interactions by adapting three powerful
multimodal fusion methods to build baselines. The gap between the best-performing methods and humans indicates the challenge and importance of this task
for the community.
</p>
</script>
<br>
<!-- <div class="">
<strong>Example of multimodal intent recognition</strong>
<img src="static/images/exmpale.png" >
</div> -->
<br>
<strong>Statistics of the MIntRec dataset</strong>
<br>
<!-- Dataset statistics: one row per metric, with the label in the first cell and the value in the second. -->
<table class="layui-table">
  <!-- Three columns are declared here, while every body row below supplies two cells. -->
  <colgroup>
    <col width="300">
    <col width="100">
    <col>
  </colgroup>
  <thead>
  </thead>
  <tbody>
    <tr>
      <td>Total number of coarse-grained intents</td>
      <td>2</td>
    </tr>
    <tr>
      <td>Total number of fine-grained intents</td>
      <td>20</td>
    </tr>
    <tr>
      <td>Total number of videos</td>
      <td>43</td>
    </tr>
    <tr>
      <td>Total number of video segments</td>
      <td>2,224</td>
    </tr>
    <tr>
      <td>Total number of words in text utterances</td>
      <td> 15,658</td>
    </tr>
    <tr>
      <td>Total number of unique words in text utterances</td>
      <td> 2,562</td>
    </tr>
    <tr>
      <td>Average length of text utterances</td>
      <td> 7.04</td>
    </tr>
    <tr>
      <td>Maximum length of text utterances</td>
      <td> 26</td>
    </tr>
    <tr>
      <td>Average length of video segments (s)</td>
      <td>2.38</td>
    </tr>
    <tr>
      <td>Maximum length of video segments (s)</td>
      <td>9.59</td>
    </tr>
  </tbody>
</table>
<style>
  /*
   * Rules for a table with id "mytable" and a row with id "best".
   * NOTE(review): no element with either id is visible in this page's static
   * markup; confirm these rules are still needed.
   */

  /* Body cells: light weight, only the bottom border kept. */
  #mytable tbody td {
    font-weight: 300;
    border-right-style: none;
    border-left-style: none;
    border-top-style: none;
  }

  /* Header cells: white bold text on the same blue as the navigation bar. */
  #mytable thead td {
    /* Was "font-size: 15;": a unitless non-zero length is invalid CSS and is ignored, so the unit is now explicit. */
    font-size: 15px;
    font-weight: 600;
    background-color: #4371C6;
    color: white;
    border-right-style: none;
    border-left-style: none;
    border-top-style: none;
  }

  /* Emphasise every cell of the "best" row. */
  #best td {
    font-weight: 800 !important;
  }
</style>
<br>
<br>
<!-- Section heading followed by the intent-taxonomy figure. The image now has a text alternative (taken from the heading) and a quoted width value. -->
<h4 style="font-weight: 600; line-height: 1.3">
Intent taxonomies of our MIntRec dataset with brief interpretations.
</h4>
<br>
<img src="static/images/table.png" width="100%" alt="Intent taxonomies of the MIntRec dataset with brief interpretations">
<br>
<br>
<!-- Section heading followed by the voting-statistics figure. The image now has a text alternative (taken from the heading) and a quoted width value. -->
<h4 style="font-weight: 600; line-height: 1.3">
Voting statistics of 2,224 samples in MIntRec.
</h4>
<br>
<img src="static/images/line.png" width="100%" alt="Voting statistics of the 2,224 samples in MIntRec">
<br>
<br>
<br>
<h4 style="font-weight: 600; line-height: 1.3">Citation </h4>
<br>
<p style='text-align:justify;margin: 0 0 10px; color:#595959; font-weight: 400;font:18px/1.5 -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Oxygen, Ubuntu, Cantarell, "Fira Sans", "Droid Sans", "Helvetica Neue", Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol";'>
Please cite the following paper if you use this dataset in your work.
</p>
<br>
<style>
  /* Citation box: padded, light-grey, rounded block that scrolls horizontally when its content is too wide. */
  #my_pre {
    padding: 8px 15px;
    background: #f8f8f8;
    border-radius: 5px;
    border: 1px solid #e5e5e5;
    overflow-x: auto !important;
    /* font-weight is flagged !important, so the font shorthand that follows does not override it. */
    font-weight: 500 !important;
    font: 15px/1.5 -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Oxygen, Ubuntu, Cantarell, "Fira Sans", "Droid Sans", "Helvetica Neue", Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol";
  }
</style>
<pre id='my_pre'>
@inproceedings{10.1145/3503161.3547906,
author = {Zhang, Hanlei and Xu, Hua and Wang, Xin and Zhou, Qianrui and Zhao, Shaojie and Teng, Jiayan},
title = {MIntRec: A New Dataset for Multimodal Intent Recognition},
year = {2022},
doi = {10.1145/3503161.3547906},
booktitle = {Proceedings of the 30th ACM International Conference on Multimedia},
pages = {1688–1697},
numpages = {10}
}
</pre>
</div>
</div>
</div>
<script>
// Once the window's load event fires, request count.json and write the parsed response to the console.
window.addEventListener('load', function () {
  var logPayload = function (payload) {
    console.log(payload);
  };
  $.getJSON("count.json", logPayload);
});
</script>
<br>
<br>
<br>
<br>
<br>
</body>
</html>
<script type="text/javascript">
// Renders the inline "template" script into #container.
//
// The template in this page contains no Mustache tags, so its rendered output
// does not depend on any data. The previous version nevertheless fetched a
// leaderboard JSON from another project's site before rendering, which had two
// consequences:
//   - if that request failed, the introduction was replaced by the text
//     "This leaderboard is not ready yet.";
//   - if any returned entry lacked a `submission` object, the callback threw
//     before rendering and #container stayed empty.
// The template is now rendered directly, with the same (empty) view object
// shape the old code started from.
(function($) {
  var template = $('#template').html();

  // Nothing to render if the template element is missing from the page.
  if (typeof template !== 'string') {
    return;
  }

  // Pre-parse so mustache.js caches the template before rendering.
  Mustache.parse(template);

  // Kept for compatibility with templates that might iterate over submissions.
  var ms_data = {
    submissions: []
  };

  $('#container').html(Mustache.render(template, ms_data));
})(jQuery);
</script>