From d53ddeb7b0f72664433c98c52f562e56f335a81a Mon Sep 17 00:00:00 2001
From: HsinYingLee <james371507@gmail.com>
Date: Wed, 30 Oct 2024 11:42:12 -0700
Subject: [PATCH] update sfm url

---
 index.html          |  58 +++++++++++++++++++++-----------------------
 resources/.DS_Store | Bin 10244 -> 0 bytes
 2 files changed, 28 insertions(+), 30 deletions(-)
 delete mode 100644 resources/.DS_Store
diff --git a/index.html b/index.html
index c984725..5942166 100644
--- a/index.html
+++ b/index.html
@@ -10,7 +10,7 @@
   <!-- <link rel="stylesheet" href="./static/css/bulma.min.css">
   <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
   <link rel="stylesheet" href="./static/css/bulma-slider.min.css"> -->
-  
+
   <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
   <link rel="stylesheet"
         href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
@@ -108,7 +108,7 @@
     height: 30px;
   }
 </style>
-  
+
 </head>
 
 <body>
@@ -117,7 +117,7 @@ <h1 style="line-height: 1.2;">
       <!-- <img src="./icons/demon_logo_transparent.png" alt="D3Mon Icon" style="width: 48px; vertical-align: middle;"> -->
       <!-- <strong><span style="color:rgb(255, 195, 21);">DELTA:</span> Dense Long-range 3D Tracking</strong> -->
       <strong>DELTA: Dense Efficient Long-range <br> 3D Tracking for Any video</strong>
-    </h1>    
+    </h1>
     <p id="authors">
       <span>
         <a href="https://ngoductuanlhp.github.io//">Tuan Duc Ngo<sup>1,2</sup></a>
@@ -142,9 +142,9 @@ <h1 style="line-height: 1.2;">
       </span>
       <br>
       <span class="institution">
-        <a href="https://research.snap.com/"><sup>1</sup> Snap Inc</a> 
+        <a href="https://research.snap.com/"><sup>1</sup> Snap Inc</a>
         <a href="https://www.cics.umass.edu/"><sup>2</sup> UMass Amherst</a>
-        <a href="https://www.ece.tuc.gr/en/home"><sup>3</sup> TU Crete</a> 
+        <a href="https://www.ece.tuc.gr/en/home"><sup>3</sup> TU Crete</a>
         <a href="https://mitibmwatsonailab.mit.edu/"><sup>4</sup> MIT-IBM Watson AI Lab</a>
       </span>
     </p>
@@ -165,15 +165,15 @@ <h1 style="line-height: 1.2;">
       <video class='round' autoplay muted loop playsinline style='width: 800px' src='resources/demo_trajs/car-roundabout_traj_concat.mp4'></video>
       </div>
     </center>
-    
+
     <br>
-  
+
     <center>
       <div class="video-container">
       <video class='round' autoplay muted loop playsinline style='width: 800px' src='resources/demo_trajs/butterfly_traj_concat.mp4'></video>
       </div>
     </center>
-    
+
     <br>
 
     <center>
@@ -181,7 +181,7 @@ <h1 style="line-height: 1.2;">
       <video class='round' autoplay muted loop playsinline style='width: 800px' src='resources/demo_trajs/tortoise_swim.mp4'></video>
       </div>
     </center>
-    
+
     <br>
 
     <center>
@@ -189,17 +189,17 @@ <h1 style="line-height: 1.2;">
       <video class='round' autoplay muted loop playsinline style='width: 800px' src='resources/demo_trajs/yellow-duck.mp4'></video>
       </div>
     </center>
-    
+
 
     <a style="text-align:center">
-      <p> 
+      <p>
         <center>
-          </strong><strong>DELTA</strong> captures <strong>dense, 3D, long-range</strong> trajectories from casual in-the-wild videos in a <strong>feed-forward</strong> manner. 
+          <strong>DELTA</strong> captures <strong>dense, 3D, long-range</strong> trajectories from casual in-the-wild videos in a <strong>feed-forward</strong> manner.
         </center>
       </p>
     </a>
 
-    
+
   </div>
 
 
@@ -210,23 +210,23 @@ <h2 style="text-align:left;">Intro Video (1min)</h2>
     </video>
   </div> -->
 
-  
+
 
   <div class="content">
     <h2 style="text-align:left;"><strong>Abstract</strong></h2>
     <font size="-0.">
       <p>
-          Tracking dense 3D motion from monocular videos remains challenging, particularly 
-          when aiming for pixel-level precision over long sequences. We introduce DELTA, 
-          a novel method that efficiently tracks every pixel in 3D space, enabling accurate 
+          Tracking dense 3D motion from monocular videos remains challenging, particularly
+          when aiming for pixel-level precision over long sequences. We introduce DELTA,
+          a novel method that efficiently tracks every pixel in 3D space, enabling accurate
           motion estimation across entire videos. Our approach leverages a joint
           global-local attention mechanism for reduced-resolution tracking, followed by a
-          transformer-based upsampler to achieve high-resolution predictions. Unlike existing 
+          transformer-based upsampler to achieve high-resolution predictions. Unlike existing
           methods, which are limited by computational inefficiency or sparse tracking,
           DELTA delivers dense 3D tracking at scale, running over 8x faster than
           previous methods while achieving state-of-the-art accuracy. Furthermore, we explore
           the impact of depth representation on tracking performance and identify
-          log-depth as the optimal choice. Extensive experiments demonstrate the superiority 
+          log-depth as the optimal choice. Extensive experiments demonstrate the superiority
           of DELTA on multiple benchmarks, achieving new state-of-the-art results in
           both 2D and 3D dense tracking tasks. Our method provides a robust solution for
           applications requiring fine-grained, long-term motion tracking in 3D space.
@@ -239,7 +239,7 @@ <h2 style="text-align:left;"><strong>Motivation</strong></h2>
     <img class="summary-img" src="./resources/combined.png" style="width:95%;margin-bottom: -10px;">
     <br>
     <p> Existing motion prediction methods struggle with short-term, sparse predictions and often fail to deliver accurate 3D motion estimations while optimization-based approaches require substantial time to process a single video.
-      We are the first method capable of <strong>efficiently</strong> tracking <strong>every pixel</strong> in <strong>3D space</strong> over <strong>hundreds of frames</strong> from monocular videos, and achieves 
+      We are the first method capable of <strong>efficiently</strong> tracking <strong>every pixel</strong> in <strong>3D space</strong> over <strong>hundreds of frames</strong> from monocular videos, and achieves
       <strong>state-of-the-art accuracy</strong> on 3D tracking benchmarks.
     </p>
   </div>
@@ -302,7 +302,7 @@ <h2 style="text-align:left;"><strong>More results</strong></h2>
 
               </table>
             </div>
-            
+
             <div class="item">
               <table align=center width=900px>
               <tr>
@@ -414,16 +414,14 @@ <h2 style="text-align:left;"><strong>Non-rigid Structure from motion</strong></h
     <br>
     <center>
       <iframe
-        width="800px" height="400px" src="http://localhost:8000/build/?playbackPath=http://localhost:8000/resources/viser_records/recording_car-roundabout.viser&initDistanceScale=0.3&initHeightOffset=0.1">
-
-        <!-- width="800px" height="400px" src="https://snap-research.github.io/DELTA/build/?playbackPath=https://snap-research.github.io/DELTA/resources/viser_records/recording_car-roundabout.viser&initDistanceScale=0.3&initHeightOffset=0.1"> -->
+        width="800px" height="400px" src="https://snap-research.github.io/DELTA/build/?playbackPath=https://snap-research.github.io/DELTA/resources/viser_records/recording_car-roundabout.viser&initDistanceScale=0.3&initHeightOffset=0.1">
       </iframe>
     </center>
 
     <br>
 
-    We first densely track pixels across multiple keyframes in the video to obtain pairwise correspondences. 
-    Using these correspondences, we jointly estimate per-keyframe depth maps and camera poses through the Global Alignment in 
+    We first densely track pixels across multiple keyframes in the video to obtain pairwise correspondences.
+    Using these correspondences, we jointly estimate per-keyframe depth maps and camera poses through the Global Alignment in
     <a href="https://dust3r.europe.naverlabs.com/">DUSt3R</a> and <a href="https://monst3r-project.github.io/">MonST3R</a>.
   </div>
 
@@ -440,7 +438,7 @@ <h2 style="text-align:left;"><strong>Consistent video editting in 3D space</stro
     </center>
 
     <br>
-  
+
     <center>
       <div class="video-container">
       <video class='round' autoplay muted loop playsinline style='height:260px' src='resources/edit_videos/rollerblade_edit_concat.mp4'></video>
@@ -449,7 +447,7 @@ <h2 style="text-align:left;"><strong>Consistent video editting in 3D space</stro
     </center>
 
     <br>
-  
+
     <center>
       <div class="video-container">
       <video class='round' autoplay muted loop playsinline style='height:260px' src='resources/edit_videos/scoccerball_edit_concat.mp4'></video>
@@ -474,8 +472,8 @@ <h4 class="title is-3"> More quantitative results can be found in our paper </h4
 <footer class="footer">
   <div class="content">
     <p>
-      <strong>Acknowledgements:</strong> We borrow this template from <a href="https://monst3r-project.github.io/">MonST3R</a> and <a href="https://snap-research.github.io/4Real/">4Real</a>. 
-      The tracking visualization is inspired by <a href="https://co-tracker.github.io/">CoTracker</a>. The camera pose visualization tool is borrowed from <a href="https://monst3r-project.github.io/">MonST3R</a>. 
+      <strong>Acknowledgements:</strong> We borrow this template from <a href="https://monst3r-project.github.io/">MonST3R</a> and <a href="https://snap-research.github.io/4Real/">4Real</a>.
+      The tracking visualization is inspired by <a href="https://co-tracker.github.io/">CoTracker</a>. The camera pose visualization tool is borrowed from <a href="https://monst3r-project.github.io/">MonST3R</a>.
       We sincerely thank the authors for publishing the source code.
       <!-- This website is built using the template of <a href="https://snap-research.github.io/4Real/">4Real</a> and <a href="https://monst3r-project.github.io/">MonST3R</a>. -->
     </p>
diff --git a/resources/.DS_Store b/resources/.DS_Store
deleted file mode 100644
index f33bef12ad35c3206c7e5b4b59443ad925de2d4c..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 10244
zcmeHM%}*0S6o1=Rx}^{?5%oe`Vq!cHpb<r4Fr`)#;z46Y4+wSJt+cw`X}X0T2uaU=
zBp&=D^k4`lJbCnH<iuJ31#h18&4+Zl>~3o!hBPzD?%R*|+nM>jUuWh`0YJ;FTPXko
z0CYU49T~!tPoeMWai~PZlPR<s;sGY11`ez(+N5~MTRl(=C<YV*iUGxdV&FJ1fO9r2
zdXigpRtzWx6axng(DA{*gW9yPEpFM+fhU#%ppD^UR`4400ERJyO$*!NmO=5GJbTat
zR1+zN#^LzhpzdhX!nU~OaL_m$G*PoAG8B!~jyQw4gO=u2ofQL$fx`^Y++7C~>QIET
zoWB=rQowikbBgYuo&3cL`@kSrP=YED$U_5>COiX|=KO7p_OlmEq3PBH=3}8|SKP+*
z^u88}#!d{x<B51OzLG1GX0Bm2*4>O*U#52t2(b%)uFb;3N~xJ2Ien8j4YT5u>I_h^
zO6c<VQN^)HGeg!L%VpRcf00P&iTud9&CS$oYQnfOw>4pGre<d5CXCsct6N(Mee}ZA
z_51nfcGV#-SdT#y!wwAd`-AgKyz=G4a*K8W+e$rs9qhGKu1Kmi>JWLgOe^s9tCDP1
zkfbNit}N`9KQ9FPT0Q&L%5wd0Xfu54-^kS+n>cIup0;s_1>XS|C6I>=sIYtD6#&pS
z%AyIx^@#`q`zOa)k6io^#-SYRyYut6&pc(Z4*YhNwBy~2zZ`Qt%A^<gZBN{j7;g)s
z-3X2PwkPTVs6L5#K=0(Aet?TC3NUYcLD~X5Wl5wLKMm}!GD!q_w*}GNTb2Wu_plK`
zt?-E96xb+*s*nSn2^x4!aPQakpF?8jJ;E47?>b^ahL8vya^xYz7t<$F^6i@}BwvRP
z8705|K*D_eWDx<hMt7FP9O4rMc}(f%+aaLj9#-#PzeheNQ7$I_RlsMD%Q&v&Q8+cW
z48eKDvy`AytSo~r=spodmtJ;6ekt-AIqHItHE?bB-5oKvbVaoXl-^Mtx>#cKOqY5*
z3K?eFplggeYNL*}$Oa6{yUvJw$DS`pi_;KfpC}`whq5Zh#>d|xHzD4#BDUv>dt-cM
z8H#ADp*MuAgt7PEut8xh@~D7%tD+cC3>*mqQT|nf?*HEk{{R0->Q*0B3@8SU2LoCx
zo6BafEp&g!uh6}A1CJ+o&_exM+%gEB*mgWxwjGZ*bUXeM9@KZ5T3YZrEo_The1he_
n{~7R)HvR&Va5-%YaFG{kD*yN2LR9&`EF|B&zC%WTm;e6;CiT(Z