<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<title>Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities</title>
<meta property="og:description" content="Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities"/>
<link href='https://fonts.googleapis.com/css?family=Titillium+Web:400,600,400italic,600italic,300,300italic' rel='stylesheet' type='text/css'>
<link href="https://fonts.googleapis.com/css2?family=Material+Icons" rel="stylesheet">
<style type="text/css">
body {
    font-family: "Titillium Web", "HelveticaNeue-Light", "Helvetica Neue Light", "Helvetica Neue", Helvetica, Arial, "Lucida Grande", sans-serif;
    font-weight: 300;
    font-size: 17px;
    margin-left: auto;
    margin-right: auto;
    width: 980px;
}
h1 {
    font-size: 40px;
    font-weight: 500;
    line-height: 1.15em;
}

h2 {
    font-size: 1.75em;
}
a:link, a:visited {
    color: #1367a7;
    text-decoration: none;
}
a:hover {
    color: #208799;
}
h1, h2, h3 {
    text-align: center;
}
h2, h3 {
    font-weight: 400;
    margin: 16px 0px 4px 0px;
}
.paper-title {
    padding: 16px 0px 16px 0px;
}
section {
    margin: 32px 0px 32px 0px;
    text-align: justify;
    clear: both;
}
.col-5 {
    width: 20%;
    float: left;
}
.col-4 {
    width: 25%;
    float: left;
}
.col-2 {
    width: 50%;
    float: left;
}
.row, .author-row, .affil-row {
    overflow: auto;
}
.author-row, .affil-row {
    font-size: 20px;
}
.row {
    margin: 16px 0px 16px 0px;
}
.authors {
    font-size: 18px;
}
.affil-row {
    margin-top: 16px;
}
.teaser {
    max-width: 100%;
}
.text-center {
    text-align: center;
}
.screenshot {
    width: 256px;
    border: 1px solid #ddd;
}
.screenshot-el {
    margin-bottom: 16px;
}
hr {
    height: 1px;
    border: 0;
    border-top: 1px solid #ddd;
    margin: 0;
}
.material-icons {
    vertical-align: -6px;
}
p {
    line-height: 1.25em;
}
.caption_justify {
    font-size: 16px;
    color: #666;
    text-align: justify;
    margin-top: 0px;
    margin-bottom: 64px;
}
.caption {
    font-size: 16px;
    color: #666;
    text-align: center;
    margin-top: 8px;
    margin-bottom: 64px;
}
.caption_inline {
    font-size: 16px;
    color: #666;
    text-align: center;
    margin-top: 8px;
    margin-bottom: 0px;
}
.caption_bold {
    font-size: 16px;
    color: #666;
    text-align: center;
    margin-top: 0px;
    margin-bottom: 0px;
    font-weight: bold;
}
video {
    display: block;
    margin: auto;
}
figure {
    display: block;
    margin: auto;
    margin-top: 10px;
    margin-bottom: 10px;
}
#bibtex pre {
    font-size: 14px;
    background-color: #eee;
    padding: 16px;
}
.blue {
    color: #2c82c9;
    font-weight: bold;
}
.orange {
    color: #d35400;
    font-weight: bold;
}
.flex-row {
    display: flex;
    flex-flow: row wrap;
    justify-content: space-around;
    padding: 0;
    margin: 0;
    list-style: none;
}
.paper-btn {
    position: relative;
    text-align: center;

    display: inline-block;
    margin: 8px;
    padding: 8px 8px;

    border-width: 0;
    outline: none;
    border-radius: 2px;

    background-color: #1367a7;
    color: #ecf0f1 !important;
    font-size: 20px;
    width: 100px;
    font-weight: 600;
}
.paper-btn-parent {
    display: flex;
    justify-content: center;
    margin: 16px 0px;
}
.paper-btn:hover {
    opacity: 0.85;
}
.container {
    margin-left: auto;
    margin-right: auto;
    padding-left: 16px;
    padding-right: 16px;
}
.venue {
    color: #1367a7;
}
</style>
</head>

<body>
<div class="container">
    <div class="paper-title">
        <h1>Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities</h1>
    </div>

    <div id="authors">
        <div class="author-row">
            <div class="col-4 text-center"><a href="https://scholar.google.com/citations?user=-juoweoAAAAJ">Fadime Sener<sup>1</sup></a></div>
            <div class="col-4 text-center"><a href="">Dibyadip Chatterjee<sup>2</sup></a></div>
            <div class="col-4 text-center"><a href="">Daniel Shelepov<sup>1</sup></a></div>
            <div class="col-4 text-center"><a href="">Kun He<sup>1</sup></a></div>
            <div class="col-4 text-center"><a href="">Dipika Singhania<sup>2</sup></a></div>
            <div class="col-4 text-center"><a href="">Robert Wang<sup>1</sup></a></div>
            <div class="col-4 text-center"><a href="">Angela Yao<sup>2</sup></a></div>
        </div>

        <div class="affil-row">
            <div class="col-2 text-center"><sup>1</sup>Reality Labs at Meta</div>
            <div class="col-2 text-center"><sup>2</sup>National University of Singapore</div>
        </div>

        <div style="clear: both">
            <div class="paper-btn-parent">
                <a class="paper-btn" href="assets/Assembly101.pdf">
                    <span class="material-icons"> description </span>
                    Paper
                </a>
                <a class="paper-btn" href="https://drive.google.com/drive/folders/1nh8PHwEw04zxkkkKlfm4fsR3IPEDvLKj?usp=sharing">
                    <span class="material-icons"> videocam </span>
                    Dataset
                </a>
                <a class="paper-btn" href="https://github.com/assembly101/assembly101">
                    <span class="material-icons"> code </span>
                    Code
                </a>
            </div>
        </div>
    </div>

    <section id="teaser-videos">

        <figure style="width: 100%; float: left">
            <video class="centered" width="100%" autoplay muted loop playsinline>
                <source src="assets/12_view_assembly.mp4" type="video/mp4">
                Your browser does not support the video tag.
            </video>
        </figure>

        <figure style="width: 100%; float: left">
            <p class="caption_justify">
                Assembly101 is a large-scale video dataset for action recognition and markerless motion capture of hand-object interactions, captured in the multi-camera cage setting shown above.
                The multi-view recordings feature participants assembling and disassembling 101 children's toys.
            </p>
        </figure>
    </section>

    <section id="news">
        <h2>News</h2>
        <hr>
        <div class="row">
            <div><span class="material-icons"> description </span> [March 28th 2022] Paper released on <a href="https://arxiv.org/pdf/2203.14712.pdf">arXiv</a>.</div>
            <div><span class="material-icons"> integration_instructions </span> [March 28th 2022] Dataset released on <a href="https://drive.google.com/drive/folders/1nh8PHwEw04zxkkkKlfm4fsR3IPEDvLKj?usp=sharing">Google Drive</a>.</div>
        </div>
    </section>

    <section id="abstract">
        <h2>Abstract</h2>
        <hr>
        <p>
            Assembly101 is a new procedural activity dataset featuring 4321 videos of people assembling and disassembling 101 "take-apart" toy vehicles. Participants work without fixed instructions, and the sequences feature rich and natural variations in action ordering, mistakes, and corrections. Assembly101 is the first multi-view action dataset, with simultaneous static (8) and egocentric (4) recordings. Sequences are annotated with more than 100K coarse and 1M fine-grained action segments, and 18M 3D hand poses. We benchmark on three action understanding tasks: recognition, anticipation and temporal segmentation. Additionally, we propose a novel task of detecting mistakes. The unique recording format and rich set of annotations allow us to investigate generalization to new toys, cross-view transfer, long-tailed distributions, and pose vs. appearance. We envision that Assembly101 will serve as a new challenge to investigate various activity understanding problems.
        </p>
    </section>
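
    <section id="annotation-example">
        <h2>Annotation Example</h2>
        <hr>
        <p>
            The abstract describes over 100K coarse and 1M fine-grained action segments. As a rough illustration of how such segment annotations could be consumed, the sketch below reads a per-split CSV with pandas. The file path and column names (video_id, start_frame, end_frame, action_cls) are hypothetical placeholders, not the released schema; please consult the GitHub repository for the actual annotation format.
        </p>
        <pre><code># Minimal sketch, assuming segments ship as one CSV row per action.
# Path and column names are hypothetical; see the repo for the real schema.
import pandas as pd

segments = pd.read_csv("fine-grained-annotations/train.csv")  # hypothetical path

# Print a few segments together with their lengths in frames.
for _, row in segments.head(5).iterrows():
    n_frames = row["end_frame"] - row["start_frame"]
    print(row["video_id"], row["action_cls"], f"{n_frames} frames")
</code></pre>
    </section>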

    <section id="paper">
        <h2>Paper</h2>
        <hr>
        <div class="flex-row">
            <div style="box-sizing: border-box; padding: 16px; margin: auto;">
                <a href="assets/Assembly101.pdf"><img class="screenshot" src="assets/assembly101_rig.png"></a>
            </div>
            <div style="width: 60%">
                <p><b>Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities</b></p>
                <p>Fadime Sener, Dibyadip Chatterjee, Daniel Shelepov, Kun He, Dipika Singhania, Robert Wang, Angela Yao</p>

                <div><span class="material-icons"> description </span><a href="assets/Assembly101.pdf"> Paper preprint </a></div>
                <div><span class="material-icons"> description </span><a href="assets/Assembly101_supp.pdf"> Supplementary </a></div>
                <div><span class="material-icons"> description </span><a href="https://arxiv.org/pdf/2203.14712.pdf"> arXiv version</a></div>
                <div><span class="material-icons"> integration_instructions </span><a href="https://github.com/assembly101/assembly101"> Code</a></div>
                <!-- <div><span class="material-icons"> videocam </span><a href="https://youtu.be/asdf"> Video</a></div> -->

                <p>Please send feedback and questions to <tt>3dassembly101&lt;at&gt;gmail.com</tt></p>
            </div>
        </div>
    </section>

    <section id="bibtex">
        <h2>Citation</h2>
        <hr>
        <pre><code>@inproceedings{sener2022assembly101,
    title     = {Assembly101: A Large-Scale Multi-View Video Dataset for Understanding Procedural Activities},
    author    = {F. Sener and D. Chatterjee and D. Shelepov and K. He and D. Singhania and R. Wang and A. Yao},
    booktitle = {CVPR},
    year      = {2022},
}
</code></pre>
    </section>
</div>
</body>
</html>