<!--
    Removed from this spot:
      * a stray "index.html" text line, which browsers rendered as visible text at the top of the page;
      * the legacy Google JSAPI loader and its google.load("jquery", "1.3.2") call. No script on this
        page uses jQuery, and the loader was requested over plain http, which browsers block as
        mixed content when the page itself is served over HTTPS.
-->

<style type="text/css">
    /* Base typography. The body is a fixed-width (1100px) column centred via auto side margins. */
    body {
        font-family: "HelveticaNeue-Light", "Helvetica Neue Light", "Helvetica Neue", Helvetica, Arial, "Lucida Grande", sans-serif;
        font-weight: 300;
        font-size: 18px;
        margin-left: auto;
        margin-right: auto;
        width: 1100px;
    }

    /* Section headings ("Abstract", "Overview", ...). */
    h1 {
        font-size: 32px;
        font-weight: 300;
    }

    /* Light grey rounded box. Not referenced by the markup in this file. */
    .disclaimerbox {
        background-color: #eee;
        border: 1px solid #eeeeee;
        -moz-border-radius: 10px;
        -webkit-border-radius: 10px;
        border-radius: 10px;
        padding: 20px;
    }

    /* Fixed-height header video with a rounded black frame. Not referenced by the markup in this file. */
    video.header-vid {
        height: 140px;
        border: 1px solid black;
        -moz-border-radius: 10px;
        -webkit-border-radius: 10px;
        border-radius: 10px;
    }

    /* Fixed-height header image with a rounded black frame. Not referenced by the markup in this file. */
    img.header-img {
        height: 140px;
        border: 1px solid black;
        -moz-border-radius: 10px;
        -webkit-border-radius: 10px;
        border-radius: 10px;
    }

    /*
     * Rounded light-grey frame for figures.
     * Every <img> on this page uses class="round", while this rule was written only for
     * "rounded" and therefore never matched. Both class names are accepted so the existing
     * markup picks up the style without having to touch each image.
     */
    img.round,
    img.rounded {
        border: 1px solid #eeeeee;
        -moz-border-radius: 10px;
        -webkit-border-radius: 10px;
        border-radius: 10px;
    }

    /* Links: blue without underline, teal on hover. */
    a:link,
    a:visited {
        color: #1367a7;
        text-decoration: none;
    }

    a:hover {
        color: #208799;
    }

    /* Large centred download cell. Not referenced by the markup in this file. */
    td.dl-link {
        height: 160px;
        text-align: center;
        font-size: 22px;
    }

    /* Stack of six "sheets" drawn with offset box shadows. Not referenced by the markup in this file. */
    .layered-paper-big { /* modified from: http://css-tricks.com/snippets/css/layered-paper/ */
        box-shadow:
                0px 0px 1px 1px rgba(0,0,0,0.35), /* The top layer shadow */
                5px 5px 0 0px #fff, /* The second layer */
                5px 5px 1px 1px rgba(0,0,0,0.35), /* The second layer shadow */
                10px 10px 0 0px #fff, /* The third layer */
                10px 10px 1px 1px rgba(0,0,0,0.35), /* The third layer shadow */
                15px 15px 0 0px #fff, /* The fourth layer */
                15px 15px 1px 1px rgba(0,0,0,0.35), /* The fourth layer shadow */
                20px 20px 0 0px #fff, /* The fifth layer */
                20px 20px 1px 1px rgba(0,0,0,0.35), /* The fifth layer shadow */
                25px 25px 0 0px #fff, /* The sixth layer */
                25px 25px 1px 1px rgba(0,0,0,0.35); /* The sixth layer shadow */
        margin-left: 10px;
        margin-right: 45px;
    }

    /* Single sheet with the same margins as .layered-paper-big. Not referenced by the markup in this file. */
    .paper-big { /* modified from: http://css-tricks.com/snippets/css/layered-paper/ */
        box-shadow:
                0px 0px 1px 1px rgba(0,0,0,0.35); /* The top layer shadow */

        margin-left: 10px;
        margin-right: 45px;
    }

    /* Stack of three sheets. Not referenced by the markup in this file. */
    .layered-paper { /* modified from: http://css-tricks.com/snippets/css/layered-paper/ */
        box-shadow:
                0px 0px 1px 1px rgba(0,0,0,0.35), /* The top layer shadow */
                5px 5px 0 0px #fff, /* The second layer */
                5px 5px 1px 1px rgba(0,0,0,0.35), /* The second layer shadow */
                10px 10px 0 0px #fff, /* The third layer */
                10px 10px 1px 1px rgba(0,0,0,0.35); /* The third layer shadow */
        margin-top: 5px;
        margin-left: 10px;
        margin-right: 30px;
        margin-bottom: 5px;
    }

    /* Vertical centring: offset by 50% via top, then pull back by half of the element's own height. */
    .vert-cent {
        position: relative;
        top: 50%;
        transform: translateY(-50%);
    }

    /* Section divider: a 1px line that fades from transparent to 75% black and back to transparent. */
    hr {
        border: 0;
        height: 1px;
        background-image: linear-gradient(to right, rgba(0, 0, 0, 0), rgba(0, 0, 0, 0.75), rgba(0, 0, 0, 0));
    }
</style>

<!-- lang lets screen readers and translation tools pick the right language for the page text. -->
<html lang="en">
    <head>
        <!-- Explicit encoding so the page never depends on the browser's locale-specific default. -->
        <meta charset="utf-8">
        <title>SphereCraft</title>
        <!-- Open Graph metadata used for link previews. -->
        <meta property="og:title" content="SphereCraft webpage" />
        <meta property="og:description" content="Gava et al. 2023" />
    </head>

    <body>
        <br>
        <!-- Paper title -->
        <center>
            <span style="font-size:36px">SphereCraft: A Dataset for Spherical Keypoint Detection, <br> Matching and Camera Pose Estimation</span>
        </center>

        <!-- Authors (first row) and affiliations (second row); superscripts map each author to an affiliation. -->
        <table align="center" width="800px">
            <tr>
                <td align="center" width="300px">
                    <center>
                        <span style="font-size:20px"><a href="https://www.linkedin.com/in/christiano-gava-b6b5164a/"> Christiano Gava <sup>1</sup> </a></span>
                    </center>
                </td>
                <td align="center" width="150px">
                    <center>
                        <span style="font-size:20px"><a href="https://www.linkedin.com/in/yunmin-cho-773176197/"> Yunmin Cho<sup>2</sup></a></span>
                    </center>
                </td>
                <td align="center" width="150px">
                    <center>
                        <span style="font-size:20px"><a href="https://de.linkedin.com/in/rave78"> Federico Raue <sup>1</sup></a></span>
                    </center>
                </td>
                <td align="center" width="150px">
                    <center>
                        <span style="font-size:20px"><a href="https://de.linkedin.com/in/spalaciob"> Sebastian Palacio <sup>1</sup></a></span>
                    </center>
                </td>
                <td align="center" width="150px">
                    <center>
                        <span style="font-size:20px"><a href="https://av.dfki.de/members/pagani/"> Alain Pagani <sup>1</sup></a></span>
                    </center>
                </td>
                <td align="center" width="150px">
                    <center>
                        <span style="font-size:20px"><a href="https://www.dfki.uni-kl.de/~dengel/indexEng.php"> Andreas Dengel <sup>1,3</sup></a></span>
                    </center>
                </td>
            </tr>
            <!-- The colspans (1 + 2 + 3) add up to the six author columns above. -->
            <tr>
                <td align="center" width="200px"> <sup>1</sup> DFKI</td>
                <td colspan="2" align="center" width="200px"> <sup>2</sup> Aimmo Germany GmbH</td>
                <td colspan="3" align="center" width="200px"> <sup>3</sup> University of Kaiserslautern-Landau</td>
            </tr>
        </table>
        <br>
        <!-- Teaser: one example per data modality (first row) with its caption (second row). -->
        <table align="center" width="800px">
            <tr>
                <td width="200px">
                    <center>
                        <img class="round" style="width:200px" src="./resources/vitoria_topview_mesh.png" alt="Top view of the 3D mesh of the Vitoria scene"/>
                    </center>
                </td>
                <td width="200px">
                    <center>
                        <img class="round" style="width:200px" src="./resources/vitoria_170_198.jpg" alt="Spherical images from the Vitoria scene"/>
                    </center>
                </td>
                <td width="200px">
                    <center>
                        <img class="round" style="width:200px" src="./resources/vitoria_depth_170_198.jpg" alt="Depth maps from the Vitoria scene"/>
                    </center>
                </td>
                <td width="200px">
                    <center>
                        <img class="round" style="width:200px" src="./resources/vitoria_superpoint_gt_matches_00000170_00000198.jpg" alt="Ground truth keypoint matches between two images of the Vitoria scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="200px">
                    <span><a href="https://www.blender.org/">Blender </a> projects + 3D meshes</span>
                </td>
                <td align="center" width="200px">
                    <span> Spherical images </span>
                </td>
                <td align="center" width="200px">
                    <span> Depth maps </span>
                </td>
                <td align="center" width="200px">
                    <span> Ground truth keypoint correspondences </span>
                </td>
            </tr>
        </table>
        <hr>
        <!--
            Publication venue. This used to sit directly inside a <table> with no row or cell,
            which is invalid: the HTML parser moved the text in front of the table and left an
            empty table behind. It is now written where the parser placed it.
        -->
        <center> Accepted at WACV-2024 </center>

        <!--
            Abstract. The heading is placed before the table instead of directly inside it:
            a <table> may not contain <center>/<h1> as a direct child, and the parser would move
            it in front of the table anyway.
        -->
        <center><h1>Abstract</h1></center>
        <table align="center" width="800px">
            <tr>
                <td>
                    <div align="justify">
                        This paper introduces SphereCraft, a dataset specifically designed for spherical keypoint detection, matching, and camera pose estimation.
                        The dataset addresses the limitations of existing datasets by providing extracted keypoints from various detectors, along with their ground-truth correspondences.
                        Synthetic scenes with photo-realistic rendering and accurate 3D meshes are included, as well as real-world scenes acquired from different spherical cameras.
                        SphereCraft enables the development and evaluation of algorithms targeting multiple camera viewpoints, advancing the state-of-the-art in computer vision tasks involving spherical images.
                    </div>
                </td>
            </tr>
        </table>

        <hr>

        <!--
            Overview / synthetic scenes.
            Two markup errors are fixed here without changing what is displayed:
              * the heading was a direct child of <table>; it is now placed before the table;
              * the anchor/satellite image grid was a <table> opened directly inside a <tr>.
                The parser reacts to that by closing the outer table first, so the grid is
                written as the sibling table it effectively already was.
        -->
        <center><h1> Overview </h1></center>
        <table align="center" width="900px">
            <tr>
                <td>
                    <span style="font-size:20px"> Synthetic Scenes </span>
                </td>
            </tr>
            <tr>
                <td>
                    <div align="justify">
                        Our dataset comprises 21 synthetic scenes of different types, sizes, and complexity and yields over 2M image pairs for training and testing spherical keypoint matching models.
                        We generate indoor and outdoor synthetic scenes with high-resolution RGB spherical images along with their depth maps and ground truth camera poses.
                        A selection of popular handcrafted and learned keypoints is then extracted from each image and accurate ground truth keypoint correspondences are established.
                        A highly accurate 3D mesh from each synthetic scene is also included.
                        The resulting data (RGB images, depth maps, camera poses, 3D meshes, keypoints and their correspondences) allows future approaches to be trained and evaluated on exactly the same data.
                        Additionally, we release all <a href="https://www.blender.org/">Blender </a> projects so other researchers can optionally render the same scenes at different resolutions or create their own version of the data according to their needs.
                        <br><br>
                        For each synthetic scene, we manually place a set of cameras to homogeneously cover it.
                        We refer to this initial set as <i>anchor</i> cameras.
                        For each anchor camera, we randomly generate a set of <i>satellite</i> cameras in its vicinity.
                        Akin to data augmentation, the idea is to automatically produce several novel views of the scene from many different positions and orientations.
                        For instance, the figure below shows an anchor image (top left) along with its 9 satellite images.
                    </div>
                </td>
            </tr>
        </table>

        <!-- Anchor image (top left) followed by its nine satellite images, five per row. -->
        <table align="center" width="900px">
            <tr>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_anchor_00000000.jpg" alt="Harmony scene: anchor image"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000001.jpg" alt="Harmony scene: satellite image 1"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000002.jpg" alt="Harmony scene: satellite image 2"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000003.jpg" alt="Harmony scene: satellite image 3"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000004.jpg" alt="Harmony scene: satellite image 4"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000005.jpg" alt="Harmony scene: satellite image 5"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000006.jpg" alt="Harmony scene: satellite image 6"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000007.jpg" alt="Harmony scene: satellite image 7"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000008.jpg" alt="Harmony scene: satellite image 8"/>
                    </center>
                </td>
                <td width="180px">
                    <center>
                        <img class="round" style="width:180px" src="./resources/harmony_satellite_00000009.jpg" alt="Harmony scene: satellite image 9"/>
                    </center>
                </td>
            </tr>
        </table>

        <br>

        <!-- Introductory note for the synthetic scene gallery that follows. -->
        <table align="center" width="900px">
            <tr>
                <td>
                    <div align="justify">
                        The resolution of the rendered spherical images and depth maps is 2048x1024 pixels.
                        Below is a sample from each synthetic scene.
                        The number in parentheses indicates the number of images in that scene.
                    </div>
                </td>
            </tr>
        </table>

        <!--
            Synthetic scene gallery: rows alternate between three sample images and their
            captions (scene name and image count). Each image carries alt text naming its scene
            so the gallery stays meaningful to screen readers and when an image fails to load.
        -->
        <table align="center" width="900px">
            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/bank_00000160.jpg" alt="Sample image from the Bank scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/barbershop_00000020.jpg" alt="Sample image from the Barbershop scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/berlin_00000140.jpg" alt="Sample image from the Berlin scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Bank (930) </span>
                </td>
                <td align="center" width="300px">
                    <span> Barbershop (80) </span>
                </td>
                <td align="center" width="300px">
                    <span> Berlin (280) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/classroom_00000210.jpg" alt="Sample image from the Classroom scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/garage_00001080.jpg" alt="Sample image from the Garage scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/harmony_00000250.jpg" alt="Sample image from the Harmony scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Classroom (370) </span>
                </td>
                <td align="center" width="300px">
                    <span> Garage (1090) </span>
                </td>
                <td align="center" width="300px">
                    <span> Harmony (380) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/italianFlat_00000040.jpg" alt="Sample image from the Italian Flat scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/kartu_00000180.jpg" alt="Sample image from the Kartu scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/loneMonk_00000560.jpg" alt="Sample image from the Lone Monk scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Italian Flat (270) </span>
                </td>
                <td align="center" width="300px">
                    <span> Kartu (640) </span>
                </td>
                <td align="center" width="300px">
                    <span> Lone Monk (670) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/medievalPort_00000000.jpg" alt="Sample image from the Medieval Port scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/middleEast_00002030.jpg" alt="Sample image from the Middle East scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/passion_00000240.jpg" alt="Sample image from the Passion scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Medieval Port (2160) </span>
                </td>
                <td align="center" width="300px">
                    <span> Middle East (4300) </span>
                </td>
                <td align="center" width="300px">
                    <span> Passion (600) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/rainbow_00000440.jpg" alt="Sample image from the Rainbow scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/seoul_00000080.jpg" alt="Sample image from the Seoul scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/shapespark_00000200.jpg" alt="Sample image from the Shapespark scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Rainbow (930) </span>
                </td>
                <td align="center" width="300px">
                    <span> Seoul (330) </span>
                </td>
                <td align="center" width="300px">
                    <span> Shapespark (860) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/showroom_00001170.jpg" alt="Sample image from the Showroom scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/simple_00000260.jpg" alt="Sample image from the Simple scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/tokyo_00000040.jpg" alt="Sample image from the Tokyo scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Showroom (1340) </span>
                </td>
                <td align="center" width="300px">
                    <span> Simple (310) </span>
                </td>
                <td align="center" width="300px">
                    <span> Tokyo (90) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/urbanCanyon_00002370.jpg" alt="Sample image from the Urban Canyon scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/vitoria_00000070.jpg" alt="Sample image from the Vitoria scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/warehouse_00000340.jpg" alt="Sample image from the Warehouse scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Urban Canyon (4090) </span>
                </td>
                <td align="center" width="300px">
                    <span> Vitoria (550) </span>
                </td>
                <td align="center" width="300px">
                    <span> Warehouse (900) </span>
                </td>
            </tr>
        </table>

        <br><br>

        <!-- Real-world scenes: sub-heading and description for the gallery that follows. -->
        <table align="center" width="900px">
            <tr>
                <td>
                    <span style="font-size:20px"> Real-World Scenes </span>
                </td>
            </tr>
            <tr>
                <td>
                    <div align="justify">
                        Along with synthetic scenes, we provide another 9 real scenes, captured with <a href="https://weiss-ag.com/de/"> Civetta </a> and <a href="https://www.ricoh360.com/theta/"> Ricoh </a> Theta-S cameras.
                        They convey 4 indoor and 5 outdoor scenes of different sizes and complexity, with resolutions considerably higher than the synthetic images.
                        Images captured with Civetta are 7070x3535 pixels, whereas those acquired with Theta-S are 5376x2688 pixels.
                        Unlike synthetic scenes, here ground truth depth maps, camera poses and keypoint correspondences are not available, but we provide keypoints extracted at the resolutions aforementioned.
                        Once again, the number in parentheses indicates the number of images in that scene.
                    </div>
                </td>
            </tr>
        </table>

        <!--
            Real-world scene gallery: rows alternate between three sample images and their
            captions (scene name and image count). The image rows are now closed explicitly
            with </tr>, like every other row in this file, and each image carries alt text
            naming its scene.
        -->
        <table align="center" width="900px">
            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/berlinStreet_00000083.jpg" alt="Sample image from the Berlin Street scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/otterbergChurch_00000015.jpg" alt="Sample image from the Church scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/corridorAV_00000088.jpg" alt="Sample image from the Corridors scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Berlin Street (186) </span>
                </td>
                <td align="center" width="300px">
                    <span> Church (54) </span>
                </td>
                <td align="center" width="300px">
                    <span> Corridors (116) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/galileo_00000000.jpg" alt="Sample image from the Meeting Room 1 scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/pascal_00000000.jpg" alt="Sample image from the Meeting Room 2 scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/stadiumKL_00000036.jpg" alt="Sample image from the Stadium scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Meeting Room 1 (18) </span>
                </td>
                <td align="center" width="300px">
                    <span> Meeting Room 2 (21) </span>
                </td>
                <td align="center" width="300px">
                    <span> Stadium (74) </span>
                </td>
            </tr>

            <tr>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/stMartinsplatz_00000022.jpg" alt="Sample image from the Town Square scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/hauptbahnhof_00000069.jpg" alt="Sample image from the Train Station scene"/>
                    </center>
                </td>
                <td width="300px">
                    <center>
                        <img class="round" style="width:300px" src="./resources/uni_00000022.jpg" alt="Sample image from the Uni scene"/>
                    </center>
                </td>
            </tr>
            <tr>
                <td align="center" width="300px">
                    <span> Town Square (35) </span>
                </td>
                <td align="center" width="300px">
                    <span> Train Station (112) </span>
                </td>
                <td align="center" width="300px">
                    <span> Uni (71) </span>
                </td>
            </tr>
        </table>

        <hr>

        <!--
            Download section. The heading is placed before the table instead of directly inside
            it: a <table> may not contain <center>/<h1> as a direct child, and the parser would
            move it in front of the table anyway.
        -->
        <center><h1> Download SphereCraft </h1></center>
        <table align="center" width="900px">
            <tr>
                <td>
                    <div align="justify">
                        Our dataset is available at <a href="https://zenodo.org/">Zenodo</a>.
                        It comprises a total of 9 records.
                        Although it is possible to download SphereCraft using Zenodo's web interface, we recommend the download script we release in SphereCraft's <a href="https://github.com/DFKI/spherecrafthub">GitHub page</a>.
                    </div>
                </td>
            </tr>
        </table>

        <hr>

        <!--
            Code section. The heading is placed before the table instead of directly inside it:
            a <table> may not contain <center>/<h1> as a direct child, and the parser would move
            it in front of the table anyway.
        -->
        <center><h1> Code and more details </h1></center>
        <table align="center" width="900px">
            <tr>
                <td>
                    <div align="justify">
                        Please visit SphereCraft's <a href="https://github.com/DFKI/spherecrafthub">GitHub page</a>.
                    </div>
                </td>
            </tr>
        </table>

        <hr>

        <!-- Footer: credit for the page template. -->
        <table align="center" width="900px">
            <tr>
                <td>
                    <div align="justify">
                        The template for this website is borrowed from <a href="https://richzhang.github.io/">Richard Zhang</a>.
                    </div>
                </td>
            </tr>
        </table>
    </body>
</html>