% Journal article. The model name is braced so sentence-casing styles keep its capitals.
@article{https://authors.library.caltech.edu/records/v8v89-3xq78,
    title   = {{CellSAM}: a foundation model for cell segmentation},
    journal = {Nature Methods},
    year    = {2025},
    volume  = {22},
    issn    = {1548-7091},
    doi     = {10.1038/s41592-025-02879-w},
    url     = {https://authors.library.caltech.edu/records/v8v89-3xq78},
    id      = {record}
}


% Proceedings paper: paper title in `title`, proceedings volume in `booktitle`.
% The DOI is stored raw (no LaTeX escaping of the underscore) so resolvers receive it intact.
@inproceedings{https://authors.library.caltech.edu/records/6ktpc-y4q09,
    title     = {{Caltech} Aerial {RGB-Thermal} Dataset in the Wild},
    booktitle = {Computer Vision -- {ECCV} 2024},
    year      = {2024},
    isbn      = {978-3-031-73035-1},
    doi       = {10.1007/978-3-031-73036-8_14},
    url       = {https://authors.library.caltech.edu/records/6ktpc-y4q09},
    id        = {record}
}


% arXiv preprint; the eprint identifier is the suffix of the arXiv DOI.
@misc{https://authors.library.caltech.edu/records/0n803-rzq26,
    title         = {Reconstructing Hand-Held Objects in {3D}},
    year          = {2024},
    eprint        = {2404.06507},
    archiveprefix = {arXiv},
    doi           = {10.48550/arxiv.2404.06507},
    url           = {https://authors.library.caltech.edu/records/0n803-rzq26},
    id            = {record}
}


% bioRxiv preprint, typed as an article so the serial name it carries is printed.
@article{https://authors.library.caltech.edu/records/47sqx-33w78,
    title   = {A Foundation Model for Cell Segmentation},
    journal = {bioRxiv},
    year    = {2024},
    issn    = {2692-8205},
    doi     = {10.1101/2023.11.17.567630},
    pmcid   = {PMC10690226},
    url     = {https://authors.library.caltech.edu/records/47sqx-33w78},
    id      = {record}
}


% arXiv preprint; mixed-case words are braced so styles do not flatten the acronym's spelling.
@misc{https://authors.library.caltech.edu/records/stvvz-was45,
    title         = {{TOTEM}: {TOkenized} Time Series {EMbeddings} for General Time Series Analysis},
    year          = {2024},
    eprint        = {2402.16412},
    archiveprefix = {arXiv},
    doi           = {10.48550/arxiv.2402.16412},
    url           = {https://authors.library.caltech.edu/records/stvvz-was45},
    id            = {record}
}


% NOTE(review): the DOI prefix suggests an ICCV 2023 proceedings paper, but the record
% carries no proceedings title -- confirm, then retype as inproceedings with a booktitle.
@misc{https://authors.library.caltech.edu/records/s7ywd-z4m89,
    title = {Pixel-Aligned Recurrent Queries for Multi-View {3D} Object Detection},
    year  = {2023},
    isbn  = {979-8-3503-0718-4},
    doi   = {10.1109/ICCV51070.2023.01684},
    url   = {https://authors.library.caltech.edu/records/s7ywd-z4m89},
    id    = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20230316-204045919,
    title = {Multiview Compressive Coding for {3D} Reconstruction},
    year  = {2023},
    url   = {https://resolver.caltech.edu/CaltechAUTHORS:20230316-204045919},
    id    = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-215117759,
    title = {Building Generalizable Agents with a Realistic and Rich {3D} Environment},
    year  = {2022},
    url   = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-215117759},
    id    = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204745839,
    title         = {{BKinD-3D}: Self-Supervised {3D} Keypoint Discovery from Multi-View Videos},
    year          = {2022},
    eprint        = {2212.07401},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2212.07401},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204745839},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204749212,
    title         = {{Omni3D}: A Large Benchmark and Model for {3D} Object Detection in the Wild},
    year          = {2022},
    eprint        = {2207.10660},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2207.10660},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204749212},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204752587,
    title         = {Learning {3D} Object Shape and Layout without {3D} Supervision},
    year          = {2022},
    eprint        = {2206.07028},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2206.07028},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204752587},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789792000.24,
    title     = {Differentiable Stereopsis: Meshes from multiple views using differentiable rendering},
    booktitle = {2022 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2022},
    isbn      = {978-1-6654-6946-3},
    doi       = {10.1109/cvpr52688.2022.00844},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789792000.24},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789795000.26,
    title     = {Learning {3D} Object Shape and Layout without {3D} Supervision},
    booktitle = {2022 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2022},
    isbn      = {978-1-6654-6946-3},
    doi       = {10.1109/cvpr52688.2022.00174},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789795000.26},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204759329,
    title         = {Recognizing Scenes from Novel Viewpoints},
    year          = {2021},
    eprint        = {2112.01520},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2112.01520},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204759329},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204755957,
    title         = {Differentiable Stereopsis: Meshes from multiple views using differentiable rendering},
    year          = {2021},
    eprint        = {2110.05472},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2110.05472},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204755957},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204802712,
    title         = {Accelerating {3D} Deep Learning with {PyTorch3D}},
    year          = {2020},
    eprint        = {2007.08501},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2007.08501},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204802712},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221219-224850812,
    title     = {{3D} Shape Reconstruction from Vision and Touch},
    booktitle = {Advances in Neural Information Processing Systems 33 ({NeurIPS} 2020)},
    year      = {2020},
    isbn      = {9781713829546},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-224850812},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204806086,
    title         = {{3D} Shape Reconstruction from Vision and Touch},
    year          = {2020},
    eprint        = {2007.03778},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.2007.03778},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204806086},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789782000.20,
    title     = {{SynSin}: End-to-End View Synthesis From a Single Image},
    booktitle = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2020},
    isbn      = {978-1-7281-7168-5},
    doi       = {10.1109/cvpr42600.2020.00749},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789782000.20},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204809456,
    title         = {{SynSin}: End-to-end View Synthesis from a Single Image},
    year          = {2019},
    eprint        = {1912.08804},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1912.08804},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204809456},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789777000.18,
    title     = {Mesh {R-CNN}},
    booktitle = {2019 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
    year      = {2019},
    isbn      = {978-1-7281-4803-8},
    doi       = {10.1109/iccv.2019.00988},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789777000.18},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-223825499,
    title         = {Mesh {R-CNN}},
    year          = {2019},
    eprint        = {1906.02739},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1906.02739},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-223825499},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789772000.17,
    title     = {Embodied Question Answering in Photorealistic Environments With Point Cloud Perception},
    booktitle = {2019 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2019},
    isbn      = {978-1-7281-3293-8},
    doi       = {10.1109/cvpr.2019.00682},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789772000.17},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789767000.16,
    title     = {Multi-Target Embodied Question Answering},
    booktitle = {2019 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2019},
    isbn      = {978-1-7281-3293-8},
    doi       = {10.1109/cvpr.2019.00647},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789767000.16},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204819572,
    title         = {Multi-Target Embodied Question Answering},
    year          = {2019},
    eprint        = {1904.04686},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1904.04686},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204819572},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204816196,
    title         = {Embodied Question Answering in Photorealistic Environments with Point Cloud Perception},
    year          = {2019},
    eprint        = {1904.03461},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1904.03461},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204816196},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204822934,
    title         = {Neural Modular Control for Embodied Question Answering},
    year          = {2018},
    eprint        = {1810.11181},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1810.11181},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204822934},
    id            = {record}
}


% Article in the Proceedings of Machine Learning Research series, volume 87.
@article{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204809634,
    title   = {Neural Modular Control for Embodied Question Answering},
    journal = {Proceedings of Machine Learning Research},
    volume  = 87,
    year    = 2018,
    issn    = {2640-3498},
    url     = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204809634},
    id      = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789753000.13,
    title     = {Detect-and-Track: Efficient Pose Estimation in Videos},
    booktitle = {2018 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition},
    year      = {2018},
    isbn      = {978-1-5386-6420-9},
    doi       = {10.1109/cvpr.2018.00044},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789753000.13},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789757000.14,
    title     = {Embodied Question Answering},
    booktitle = {2018 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition},
    year      = {2018},
    isbn      = {978-1-5386-6420-9},
    doi       = {10.1109/cvpr.2018.00008},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789757000.14},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789762000.15,
    title     = {Detecting and Recognizing Human-Object Interactions},
    booktitle = {2018 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition},
    year      = {2018},
    isbn      = {978-1-5386-6420-9},
    doi       = {10.1109/cvpr.2018.00872},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789762000.15},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789751000.12,
    title     = {Data Distillation: Towards Omni-Supervised Learning},
    booktitle = {2018 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition},
    year      = {2018},
    isbn      = {978-1-5386-6420-9},
    doi       = {10.1109/cvpr.2018.00433},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789751000.12},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204826312,
    title         = {Building Generalizable Agents with a Realistic and Rich {3D} Environment},
    year          = {2018},
    eprint        = {1801.02209},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1801.02209},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204826312},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204836433,
    title         = {Detect-and-Track: Efficient Pose Estimation in Videos},
    year          = {2017},
    eprint        = {1712.09184},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1712.09184},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204836433},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204839800,
    title         = {Data Distillation: Towards Omni-Supervised Learning},
    year          = {2017},
    eprint        = {1712.04440},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1712.04440},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204839800},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204833051,
    title         = {Embodied Question Answering},
    year          = {2017},
    eprint        = {1711.11543},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1711.11543},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204833051},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789744000.10,
    title     = {Mask {R-CNN}},
    booktitle = {2017 {IEEE} International Conference on Computer Vision ({ICCV})},
    year      = {2017},
    isbn      = {978-1-5386-1032-9},
    doi       = {10.1109/iccv.2017.322},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789744000.10},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789739000.9,
    title     = {{Learn2Smile}: Learning non-verbal interaction through observation},
    booktitle = {2017 {IEEE/RSJ} International Conference on Intelligent Robots and Systems ({IROS})},
    year      = {2017},
    isbn      = {978-1-5386-2682-5},
    doi       = {10.1109/iros.2017.8206272},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789739000.9},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204829682,
    title = {Detecting and Recognizing Human-Object Interactions},
    year  = {2017},
    url   = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204829682},
    id    = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204843170,
    title         = {Mask {R-CNN}},
    year          = {2017},
    eprint        = {1703.06870},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1703.06870},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204843170},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings volume in `booktitle`.
% The DOI is stored raw (no LaTeX escaping of the underscore) so resolvers receive it intact.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789734000.8,
    title     = {Chained Predictions Using Convolutional Neural Networks},
    booktitle = {Computer Vision -- {ECCV} 2016},
    year      = {2016},
    isbn      = {9783319464923},
    doi       = {10.1007/978-3-319-46493-0_44},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789734000.8},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204846541,
    title         = {Chained Predictions Using Convolutional Neural Networks},
    year          = {2016},
    eprint        = {1605.02346},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1605.02346},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204846541},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789729000.6,
    title     = {Contextual Action Recognition with {R*CNN}},
    booktitle = {2015 {IEEE} International Conference on Computer Vision ({ICCV})},
    year      = {2015},
    isbn      = {978-1-4673-8391-2},
    doi       = {10.1109/iccv.2015.129},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789729000.6},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789725000.5,
    title     = {Actions and Attributes from Wholes and Parts},
    booktitle = {2015 {IEEE} International Conference on Computer Vision ({ICCV})},
    year      = {2015},
    isbn      = {978-1-4673-8391-2},
    doi       = {10.1109/iccv.2015.284},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789725000.5},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789721000.4,
    title     = {Finding action tubes},
    booktitle = {2015 {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR})},
    year      = {2015},
    isbn      = {978-1-4673-6964-0},
    doi       = {10.1109/cvpr.2015.7298676},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789721000.4},
    id        = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204849905,
    title         = {Contextual Action Recognition with {R*CNN}},
    year          = {2015},
    eprint        = {1505.01197},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1505.01197},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204849905},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204853268,
    title         = {Actions and Attributes from Wholes and Parts},
    year          = {2014},
    eprint        = {1412.2604},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1412.2604},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204853268},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204856628,
    title         = {Finding Action Tubes},
    year          = {2014},
    eprint        = {1411.6031},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1411.6031},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204856628},
    id            = {record}
}


@misc{https://resolver.caltech.edu/CaltechAUTHORS:20221219-204859995,
    title         = {{R-CNNs} for Pose Estimation and Action Detection},
    year          = {2014},
    eprint        = {1406.5212},
    archiveprefix = {arXiv},
    doi           = {10.48550/arXiv.1406.5212},
    url           = {https://resolver.caltech.edu/CaltechAUTHORS:20221219-204859995},
    id            = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789716000.3,
    title     = {Using {k-Poselets} for Detecting People and Localizing Their Keypoints},
    booktitle = {2014 {IEEE} Conference on Computer Vision and Pattern Recognition},
    year      = {2014},
    isbn      = {978-1-4799-5118-5},
    doi       = {10.1109/cvpr.2014.458},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789716000.3},
    id        = {record}
}


% Proceedings paper: paper title in `title`, proceedings name in `booktitle`.
@inproceedings{https://resolver.caltech.edu/CaltechAUTHORS:20221215-789688000.2,
    title     = {Articulated Pose Estimation Using Discriminative Armlet Classifiers},
    booktitle = {2013 {IEEE} Conference on Computer Vision and Pattern Recognition},
    year      = {2013},
    isbn      = {978-1-5386-5672-3},
    doi       = {10.1109/cvpr.2013.429},
    url       = {https://resolver.caltech.edu/CaltechAUTHORS:20221215-789688000.2},
    id        = {record}
}