[ { "id": "https://authors.library.caltech.edu/records/pvmcz-13r80", "eprint_id": 121550, "eprint_status": "archive", "datestamp": "2023-08-20 16:54:08", "lastmod": "2023-10-23 15:39:15", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Gao-Angela-F", "name": { "family": "Gao", "given": "Angela F." }, "orcid": "0000-0001-8574-8728" }, { "id": "Leong-Oscar", "name": { "family": "Leong", "given": "Oscar" } }, { "id": "Sun-He", "name": { "family": "Sun", "given": "He" }, "orcid": "0000-0003-1526-6787" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" } ] }, "title": "Image Reconstruction without Explicit Priors", "ispublished": "unpub", "full_text_status": "public", "note": "\u00a9 2023 IEEE. \n\nThis work was sponsored by NSF Award 2048237 and 1935980, an Amazon AI4Science Partnership Discovery Grant, and the Caltech/JPL President's and Director's Research and Development Fund (PDRDF). This research was carried out at the Jet Propulsion Laboratory and Caltech under a contract with the National Aeronautics and Space Administration and funded through the PDRDF.", "abstract": "We consider solving ill-posed imaging inverse problems without access to an explicit image prior or ground-truth examples. An overarching challenge in inverse problems is that there are many undesired images that fit to the observed measurements, thus requiring image priors to constrain the space of possible solutions to more plausible reconstructions. However, in many applications it is difficult or potentially impossible to obtain ground-truth images to learn an image prior. Thus, inaccurate priors are often used, which inevitably result in biased solutions. Rather than solving an inverse problem using priors that encode the explicit structure of any one image, we propose to solve a set of inverse problems jointly by incorporating prior constraints on the collective structure of the underlying images. The key assumption of our work is that the ground-truth images we aim to reconstruct share common, low-dimensional structure. We show that such a set of inverse problems can be solved simultaneously by learning a shared image generator with a low-dimensional latent space. The parameters of the generator and latent embedding are learned by maximizing a proxy for the Evidence Lower Bound (ELBO). Once learned, the generator and latent embeddings can be combined to provide reconstructions for each inverse problem. The framework we propose can handle general forward model corruptions, and we show that measurements derived from only a few ground-truth images (O(10)) are sufficient for image reconstruction without explicit priors.", "date": "2023-06", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "id_number": "CaltechAUTHORS:20230526-662984000.7", "isbn": "9781728163277", "book_title": "2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20230526-662984000.7", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "CCF-2048237" }, { "agency": "NSF", "grant_number": "AST-1935980" }, { "agency": "Amazon AI4Science Fellowship" }, { "agency": "JPL President and Director's Fund" }, { "agency": "NASA/JPL/Caltech" } ] }, "doi": "10.1109/icassp49357.2023.10096515", "resource_type": "book_section", "pub_year": "2023", "author_list": "Gao, Angela F.; Leong, Oscar; et al."
}, { "id": "https://authors.library.caltech.edu/records/jmn81-k7q70", "eprint_id": 117607, "eprint_status": "archive", "datestamp": "2023-08-20 06:09:18", "lastmod": "2023-10-24 22:35:44", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Gao-Angela-F", "name": { "family": "Gao", "given": "Angela F." }, "orcid": "0000-0001-8574-8728" }, { "id": "Castellanos-Jorge-C", "name": { "family": "Castellanos", "given": "Jorge C." }, "orcid": "0000-0002-0103-6430" }, { "id": "Yue-Yisong", "name": { "family": "Yue", "given": "Yisong" }, "orcid": "0000-0001-9127-1989" }, { "id": "Ross-Z-E", "name": { "family": "Ross", "given": "Zachary E." }, "orcid": "0000-0002-6343-8400" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" } ] }, "title": "DeepGEM: Generalized Expectation-Maximization for Blind Inversion", "ispublished": "unpub", "full_text_status": "public", "note": "This research was carried out at the Jet Propulsion Laboratory and the California Institute of Technology under a contract with the National Aeronautics and Space Administration and funded through the President's and Director's Research and Development Fund (PDRDF). This work was sponsored by Beyond Limits, Jet Propulsion Laboratory Award 1669417, NSF Award 2048237, and generous gifts from Luke Wang and Yi Li. Additionally, we would like to thank He Sun for many helpful discussions. We declare no competing interests.\n\nPublished - GAO_ANIPS_2021.pdf", "abstract": "Typically, inversion algorithms assume that a forward model, which relates a source to its resulting measurements, is known and fixed. Using collected indirect measurements and the forward model, the goal becomes to recover the source. When the forward model is unknown, or imperfect, artifacts due to model mismatch occur in the recovery of the source. In this paper, we study the problem of blind inversion: solving an inverse problem with unknown or imperfect knowledge of the forward model parameters. We propose DeepGEM, a variational Expectation-Maximization (EM) framework that can be used to solve for the unknown parameters of the forward model in an unsupervised manner. DeepGEM makes use of a normalizing flow generative network to efficiently capture complex posterior distributions, which leads to more accurate evaluation of the source's posterior distribution used in EM. We showcase the effectiveness of our DeepGEM approach by achieving strong performance on the challenging problem of blind seismic tomography, where we significantly outperform the standard method used in seismology. We also demonstrate the generality of DeepGEM by applying it to a simple case of blind deconvolution.", "date": "2021-12", "date_type": "published", "publisher": "Neural Information Processing Systems Foundation", "place_of_pub": "La Jolla, CA", "pagerange": "1-12", "id_number": "CaltechAUTHORS:20221026-200931912", "isbn": "9781713845393", "book_title": "35th Conference on Neural Information Processing Systems", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20221026-200931912", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NASA/JPL/Caltech" }, { "agency": "JPL President and Director's Fund" }, { "agency": "Beyond Limits" }, { "agency": "JPL", "grant_number": "1669417" }, { "agency": "NSF", "grant_number": "CCF-2048237" } ] }, "local_group": { "items": [ { "id": "Seismological-Laboratory" }, { "id": "Astronomy-Department" }, { "id": "Center-for-Geomechanics-and-Mitigation-of-Geohazards-(GMG)" }, { "id": "Division-of-Geological-and-Planetary-Sciences" } ] }, "contributors": { "items": [ { "id": "Ranzato-M", "name": { "family": "Ranzato", "given": "M." } }, { "id": "Beygelzimer-A", "name": { "family": "Beygelzimer", "given": "A." } }, { "id": "Dauphin-Y", "name": { "family": "Dauphin", "given": "Y." } }, { "id": "Liang-P-S", "name": { "family": "Liang", "given": "P. S." } }, { "id": "Wortman-Vaughan-J", "name": { "family": "Wortman Vaughan", "given": "J." }, "orcid": "0000-0002-7807-2018" } ] }, "primary_object": { "basename": "GAO_ANIPS_2021.pdf", "url": "https://authors.library.caltech.edu/records/jmn81-k7q70/files/GAO_ANIPS_2021.pdf" }, "resource_type": "book_section", "pub_year": "2021", "author_list": "Gao, Angela F.; Castellanos, Jorge C.; et al."
}, { "id": "https://authors.library.caltech.edu/records/wbj75-1gv55", "eprint_id": 113765, "eprint_status": "archive", "datestamp": "2023-08-20 05:26:25", "lastmod": "2023-10-23 15:37:41", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Levis-Aviad", "name": { "family": "Levis", "given": "Aviad" }, "orcid": "0000-0001-7307-632X" }, { "id": "Lee-Daeyoung", "name": { "family": "Lee", "given": "Daeyoung" } }, { "id": "Tropp-J-A", "name": { "family": "Tropp", "given": "Joel A." }, "orcid": "0000-0003-1024-1791" }, { "id": "Gammie-Charles-F", "name": { "family": "Gammie", "given": "Charles F." }, "orcid": "0000-0001-7451-8935" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" } ] }, "title": "Inference of Black Hole Fluid-Dynamics from Sparse Interferometric Measurements", "ispublished": "unpub", "full_text_status": "restricted", "note": "\u00a9 2021 IEEE. \n\nThe authors would like to thank George Wong for his help with GRMHD simulations. AL is supported by the Zuckerman and Viterbi postdoctoral fellowships. This work was supported by NSF award 1935980: \"Next Generation Event Horizon Telescope Design,\" and Beyond Limits, and NSF awards 1743747, 1716327, and 2034306, XSEDE allocation TG-AST170024, and TACC Frontera LSCP AST20023. JAT was supported by ONR BRC Award N00014-18-1-2363 and NSF FRG Award 1952735.", "abstract": "We develop an approach to recover the underlying properties of fluid-dynamical processes from sparse measurements. We are motivated by the task of imaging the stochastically evolving environment surrounding black holes, and demonstrate how flow parameters can be estimated from sparse interferometric measurements used in radio astronomical imaging. To model the stochastic flow we use spatio-temporal Gaussian Random Fields (GRFs). The high dimensionality of the underlying source video makes direct representation via a GRF's full covariance matrix intractable. In contrast, stochastic partial differential equations are able to capture correlations at multiple scales by specifying only local interaction coefficients. Our approach estimates the coefficients of a space-time diffusion equation that dictates the stationary statistics of the dynamical process. We analyze our approach on realistic simulations of black hole evolution and demonstrate its advantage over state-of-the-art dynamic black hole imaging techniques.", "date": "2021-10", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "2320-2329", "id_number": "CaltechAUTHORS:20220307-188412000", "isbn": "978-1-6654-2812-5", "book_title": "2021 IEEE/CVF International Conference on Computer Vision (ICCV)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20220307-188412000", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "Zuckerman STEM Leadership Program" }, { "agency": "Viterbi fellowship" }, { "agency": "NSF", "grant_number": "AST-1935980" }, { "agency": "NSF", "grant_number": "OISE-1743747" }, { "agency": "NSF", "grant_number": "AST-1716327" }, { "agency": "NSF", "grant_number": "AST-2034306" }, { "agency": "NSF", "grant_number": "TG-AST170024" }, { "agency": "NSF", "grant_number": "AST-20023" }, { "agency": "Office of Naval Research (ONR)", "grant_number": "N00014-18-1-2363" }, { "agency": "NSF", "grant_number": "IIS-1952735" } ] }, "doi": "10.1109/iccv48922.2021.00234", "resource_type": "book_section", "pub_year": "2021", "author_list": "Levis, Aviad; Lee, Daeyoung; et al."
}, { "id": "https://authors.library.caltech.edu/records/k65xp-y9147", "eprint_id": 109060, "eprint_status": "archive", "datestamp": "2023-08-20 05:13:01", "lastmod": "2023-10-23 17:32:16", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Cosner-Ryan-K", "name": { "family": "Cosner", "given": "Ryan K." } }, { "id": "Singletary-Andrew-W", "name": { "family": "Singletary", "given": "Andrew W." }, "orcid": "0000-0001-6635-4256" }, { "id": "Taylor-Andrew-J", "name": { "family": "Taylor", "given": "Andrew J." }, "orcid": "0000-0002-5990-590X" }, { "id": "Moln\u00e1r-Tam\u00e1s-G", "name": { "family": "Molnar", "given": "Tam\u00e1s G." }, "orcid": "0000-0002-9379-7121" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Ames-A-D", "name": { "family": "Ames", "given": "Aaron D." }, "orcid": "0000-0003-0848-3177" } ] }, "title": "Measurement-Robust Control Barrier Functions: Certainty in Safety with Uncertainty in State", "ispublished": "unpub", "full_text_status": "public", "note": "\u00a9 2021 IEEE. \n\nThis research is supported in part by the National Science Foundation, CPS Award #1932091; DOW Chemical, project 227027AT; British Petroleum; and Aerovironment.\n\nSubmitted - 2104.14030.pdf", "abstract": "The increasing complexity of modern robotic systems and the environments they operate in necessitates the formal consideration of safety in the presence of imperfect measurements. In this paper we propose a rigorous framework for safety-critical control of systems with erroneous state estimates. We develop this framework by leveraging Control Barrier Functions (CBFs) and unifying the method of Backup Sets for synthesizing control invariant sets with robustness requirements\u2014the end result is the synthesis of Measurement-Robust Control Barrier Functions (MR-CBFs). This provides theoretical guarantees on safe behavior in the presence of imperfect measurements and improved robustness over standard CBF approaches. We demonstrate the efficacy of this framework both in simulation and experimentally on a Segway platform using an onboard stereo-vision camera for state estimation.", "date": "2021-09-27", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "6286-6291", "id_number": "CaltechAUTHORS:20210510-141401087", "isbn": "978-1-6654-1715-0", "book_title": "2021 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20210510-141401087", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "CNS-1932091" }, { "agency": "Dow Chemical Company", "grant_number": "227027AT" }, { "agency": "British Petroleum" }, { "agency": "AeroVironment" } ] }, "doi": "10.1109/IROS51168.2021.9636584", "primary_object": { "basename": "2104.14030.pdf", "url": "https://authors.library.caltech.edu/records/k65xp-y9147/files/2104.14030.pdf" }, "resource_type": "book_section", "pub_year": "2021", "author_list": "Cosner, Ryan K.; Singletary, Andrew W.; et al."
}, { "id": "https://authors.library.caltech.edu/records/7249p-fqn69", "eprint_id": 109398, "eprint_status": "archive", "datestamp": "2023-08-20 03:17:38", "lastmod": "2024-01-15 21:22:55", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Sun-He", "name": { "family": "Sun", "given": "He" }, "orcid": "0000-0003-1526-6787" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" } ] }, "title": "Deep Probabilistic Imaging: Uncertainty Quantification and Multi-modal Solution Characterization for Computational Imaging", "ispublished": "unpub", "full_text_status": "public", "keywords": "Computational Photography, Image & Video Synthesis", "note": "\u00a9 2021 Association for the Advancement of Artificial Intelligence. \n\nPublished 2021-05-18. \n\nThis work was supported by NSF award 1935980: Next Generation Event Horizon Telescope Design, and Beyond Limits. The authors would also like to thank Joe Marino, Dominic Pesce, S. Kevin Zhou, and Tianwei Yin for the helpful discussions.\n\nAccepted Version - 2010.14462.pdf\nSupplemental Material - DPIsupplement.pdf", "abstract": "Computational image reconstruction algorithms generally produce a single image without any measure of uncertainty or confidence. Regularized Maximum Likelihood (RML) and feed-forward deep learning approaches for inverse problems typically focus on recovering a point estimate. This is a serious limitation when working with under-determined imaging systems, where it is conceivable that multiple image modes would be consistent with the measured data. Characterizing the space of probable images that explain the observational data is therefore crucial. In this paper, we propose a variational deep probabilistic imaging approach to quantify reconstruction uncertainty. Deep Probabilistic Imaging (DPI) employs an untrained deep generative model to estimate a posterior distribution of an unobserved image. This approach does not require any training data; instead, it optimizes the weights of a neural network to generate image samples that fit a particular measurement dataset. Once the network weights have been learned, the posterior distribution can be efficiently sampled. We demonstrate this approach in the context of interferometric radio imaging, which is used for black hole imaging with the Event Horizon Telescope, and compressed sensing Magnetic Resonance Imaging (MRI).", "date": "2021-05-18", "date_type": "published", "publisher": "Association for the Advancement of Artificial Intelligence", "id_number": "CaltechAUTHORS:20210604-142552450", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20210604-142552450", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "AST-1935980" }, { "agency": "Beyond Limits" } ] }, "local_group": { "items": [ { "id": "Astronomy-Department" } ] }, "doi": "10.48550/arXiv.2010.14462", "primary_object": { "basename": "2010.14462.pdf", "url": "https://authors.library.caltech.edu/records/7249p-fqn69/files/2010.14462.pdf" }, "related_objects": [ { "basename": "DPIsupplement.pdf", "url": "https://authors.library.caltech.edu/records/7249p-fqn69/files/DPIsupplement.pdf" } ], "resource_type": "book_section", "pub_year": "2021", "author_list": "Sun, He and Bouman, Katherine L." }, { "id": "https://authors.library.caltech.edu/records/r5pjt-ezf04", "eprint_id": 103735, "eprint_status": "archive", "datestamp": "2023-08-22 04:34:22", "lastmod": "2023-10-20 16:40:00", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Sun-He", "name": { "family": "Sun", "given": "He" } }, { "id": "Dalca-Adrian-V", "name": { "family": "Dalca", "given": "Adrian V." }, "orcid": "0000-0002-8422-0136" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L."
}, "orcid": "0000-0003-0077-4367" } ] }, "title": "Learning a Probabilistic Strategy for Computational Imaging Sensor Selection", "ispublished": "unpub", "full_text_status": "public", "keywords": "Computational Imaging, Optimized Sensing, Ising Model, Deep Learning, VLBI, Interferometry", "note": "\u00a9 2020 IEEE. \n\nThe authors would like to thank Lindy Blackburn, Alexander Raymond, Michael Johnson, and Sheperd Doeleman for helpful discussions on the constraints of a next-generation EHT array, and Michael Kellman for helpful discussions on Fourier ptychography. \n\nThis work was supported by NSF award 1935980: \"Next Generation Event Horizon Telescope Design,\" and Beyond Limits.\n\nAccepted Version - 2003.10424.pdf", "abstract": "Optimized sensing is important for computational imaging in low-resource environments, when images must be recovered from severely limited measurements. In this paper, we propose a physics-constrained, fully differentiable, autoencoder that learns a probabilistic sensor-sampling strategy for optimized sensor design. The proposed method learns a system's preferred sampling distribution that characterizes the correlations between different sensor selections as a binary, fully-connected Ising model. The learned probabilistic model is achieved by using a Gibbs sampling inspired network architecture, and is trained end-to-end with a reconstruction network for efficient co-design. The proposed framework is applicable to sensor selection problems in a variety of computational imaging applications. In this paper, we demonstrate the approach in the context of a very-long-baseline-interferometry (VLBI) array design task, where sensor correlations and atmospheric noise present unique challenges. We demonstrate results broadly consistent with expectation, and draw attention to particular structures preferred in the telescope array geometry that can be leveraged to plan future observations and design array expansions.", "date": "2020-04", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "1-12", "id_number": "CaltechAUTHORS:20200605-134947553", "isbn": "9781728152301", "book_title": "2020 IEEE International Conference on Computational Photography (ICCP)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20200605-134947553", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "AST-1935980" } ] }, "local_group": { "items": [ { "id": "Astronomy-Department" } ] }, "doi": "10.1109/iccp48838.2020.9105133", "primary_object": { "basename": "2003.10424.pdf", "url": "https://authors.library.caltech.edu/records/r5pjt-ezf04/files/2003.10424.pdf" }, "resource_type": "book_section", "pub_year": "2020", "author_list": "Sun, He; Dalca, Adrian V.; et al." }, { "id": "https://authors.library.caltech.edu/records/5gqc8-zfw53", "eprint_id": 94482, "eprint_status": "archive", "datestamp": "2023-08-22 01:41:13", "lastmod": "2023-10-20 18:00:01", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Ye-Vickie", "name": { "family": "Ye", "given": "Vickie" } }, { "id": "Yedidia-A-B", "name": { "family": "Yedidia", "given": "Adam B." } }, { "id": "Durand-F", "name": { "family": "Durand", "given": "Fredo" } }, { "id": "Wornell-G-W", "name": { "family": "Wornell", "given": "Gregory W." } }, { "id": "Torralba-A", "name": { "family": "Torralba", "given": "Antonio" } }, { "id": "Freeman-W-T", "name": { "family": "Freeman", "given": "William T."
}, "orcid": "0000-0002-2231-7995" } ] }, "title": "Turning Corners into Cameras: Principles and Methods", "ispublished": "unpub", "full_text_status": "restricted", "note": "\u00a9 2017 IEEE. \n\nThis work was supported in part by the DARPA REVEAL Program under contract No. HR0011-16-C-0030, NSF Grant 1212849, Shell Research, and an NDSEG Fellowship (to ABY). We thank Yoav Schechner, Jeff Shapiro, Franco Wang, and Vivek Goyal for helpful discussions.", "abstract": "We show that walls, and other obstructions with edges, can be exploited as naturally-occurring \"cameras\" that reveal the hidden scenes beyond them. In particular, we demonstrate methods for using the subtle spatio-temporal radiance variations that arise on the ground at the base of a wall's edge to construct a one-dimensional video of the hidden scene behind the wall. The resulting technique can be used for a variety of applications in diverse physical settings. From standard RGB video recordings, we use edge cameras to recover 1-D videos that reveal the number and trajectories of people moving in an occluded scene. We further show that adjacent wall edges, such as those that arise in the case of an open doorway, yield a stereo camera from which the 2-D location of hidden, moving objects can be recovered. We demonstrate our technique in a number of indoor and outdoor environments involving varied floor surfaces and illumination conditions.", "date": "2017-10", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "2289-2297", "id_number": "CaltechAUTHORS:20190404-161219288", "isbn": "9781538610329", "book_title": "2017 IEEE International Conference on Computer Vision (ICCV)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190404-161219288", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "Defense Advanced Research Projects Agency (DARPA)", "grant_number": "HR0011-16-C-0030" }, { "agency": "NSF", "grant_number": "IIS-1212849" }, { "agency": "Shell Research" }, { "agency": "National Defense Science and Engineering Graduate (NDSEG) Fellowship" } ] }, "local_group": { "items": [ { "id": "Astronomy-Department" } ] }, "doi": "10.1109/iccv.2017.249", "resource_type": "book_section", "pub_year": "2017", "author_list": "Bouman, Katherine L.; Ye, Vickie; et al." }, { "id": "https://authors.library.caltech.edu/records/mrsap-xv786", "eprint_id": 94483, "eprint_status": "archive", "datestamp": "2023-08-22 01:35:23", "lastmod": "2023-10-20 18:00:04", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Sreehari-S", "name": { "family": "Sreehari", "given": "Suhas" } }, { "id": "Venkatakrishnan-S-V", "name": { "family": "Venkatakrishnan", "given": "S. V." } }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Simmons-J-P", "name": { "family": "Simmons", "given": "Jeff P." } }, { "id": "Drummy-L-F", "name": { "family": "Drummy", "given": "Larry F." }, "orcid": "0000-0002-6452-5768" }, { "id": "Bouman-C-A", "name": { "family": "Bouman", "given": "Charles A."
} } ] }, "title": "Multi-Resolution Data Fusion for Super-Resolution Electron Microscopy", "ispublished": "unpub", "full_text_status": "restricted", "note": "\u00a9 2017 IEEE.", "abstract": "Perhaps surprisingly, all electron microscopy (EM) data collected to date is less than a cubic millimeter - presenting a huge demand in the materials and biological sciences to image at greater speed and lower dosage, while maintaining resolution. Traditional EM imaging based on homogeneous raster scanning severely limits the volume of high-resolution data that can be collected, and presents a fundamental limitation to understanding physical processes such as material deformation and crack propagation. We introduce a multi-resolution data fusion (MDF) method for super-resolution computational EM. Our method combines innovative data acquisition with novel algorithmic techniques to dramatically improve the resolution/volume/speed trade-off. The key to our approach is to collect the entire sample at low resolution, while simultaneously collecting a small fraction of data at high resolution. The high-resolution measurements are then used to create a material-specific model that is used within the \"plug-and-play\" framework to dramatically improve resolution of the low-resolution data. We present results using FEI electron microscope data that demonstrate super-resolution factors of 4x-16x, while substantially maintaining high image quality and reducing dosage.", "date": "2017-07", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "1084-1092", "id_number": "CaltechAUTHORS:20190404-161219383", "isbn": "9781538607336", "book_title": "2017 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190404-161219383", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "local_group": { "items": [ { "id": "Astronomy-Department" } ] }, "doi": "10.1109/cvprw.2017.146", "resource_type": "book_section", "pub_year": "2017", "author_list": "Sreehari, Suhas; Venkatakrishnan, S. V.; et al." }, { "id": "https://authors.library.caltech.edu/records/08h0f-azh33", "eprint_id": 94521, "eprint_status": "archive", "datestamp": "2023-08-22 01:31:29", "lastmod": "2024-01-14 21:42:05", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Dalca-A-V", "name": { "family": "Dalca", "given": "Adrian V." }, "orcid": "0000-0002-8422-0136" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Freeman-W-T", "name": { "family": "Freeman", "given": "William T." }, "orcid": "0000-0002-2231-7995" }, { "id": "Rost-N-S", "name": { "family": "Rost", "given": "Natalia S." } }, { "id": "Sabuncu-M-R", "name": { "family": "Sabuncu", "given": "Mert R." }, "orcid": "0000-0002-7068-719X" }, { "id": "Golland-P", "name": { "family": "Golland", "given": "Polina" } } ] }, "title": "Population Based Image Imputation", "ispublished": "unpub", "full_text_status": "restricted", "note": "\u00a9 Springer International Publishing AG 2017. \n\nWe acknowledge the following funding sources: NIH NINDS R01NS086905, NIH NICHD U01HD087211, NIH NIBIB NAC P41EB015902, NIH R41AG052246-01, 1K25EB013649-01, 1R21AG050122-01, and Wistron Corporation.", "abstract": "We present an algorithm for creating high resolution anatomically plausible images consistent with acquired clinical brain MRI scans with large inter-slice spacing. Although large databases of clinical images contain a wealth of information, medical acquisition constraints result in sparse scans that miss much of the anatomy. These characteristics often render computational analysis impractical as standard processing algorithms tend to fail when applied to such images. Highly specialized or application-specific algorithms that explicitly handle sparse slice spacing do not generalize well across problem domains. In contrast, our goal is to enable application of existing algorithms that were originally developed for high resolution research scans to significantly undersampled scans. We introduce a model that captures fine-scale anatomical similarity across subjects in clinical image collections and use it to fill in the missing data in scans with large slice spacing. Our experimental results demonstrate that the proposed method outperforms current upsampling methods and promises to facilitate subsequent analysis not previously possible with scans of this quality.", "date": "2017-05-23", "date_type": "published", "publisher": "Springer", "place_of_pub": "Cham, Switzerland", "pagerange": "659-671", "id_number": "CaltechAUTHORS:20190405-160617876", "isbn": "9783319590493", "book_title": "Information Processing in Medical Imaging. IPMI 2017", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190405-160617876", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NIH", "grant_number": "R01NS086905" }, { "agency": "NIH", "grant_number": "U01HD087211" }, { "agency": "NIH", "grant_number": "P41EB015902" }, { "agency": "NIH", "grant_number": "R41AG052246-01" }, { "agency": "NIH", "grant_number": "1K25EB013649-01" }, { "agency": "NIH", "grant_number": "1R21AG050122-01" }, { "agency": "Wistron Corporation" } ] }, "local_group": { "items": [ { "id": "Astronomy-Department" } ] }, "contributors": { "items": [ { "id": "Niethammer-M", "name": { "family": "Niethammer", "given": "Marc" } }, { "id": "Styner-M", "name": { "family": "Styner", "given": "Martin" } }, { "id": "Aylward-S", "name": { "family": "Aylward", "given": "Stephen" } }, { "id": "Zhu-Hongtu", "name": { "family": "Zhu", "given": "Hongtu" } }, { "id": "Oguz-I", "name": { "family": "Oguz", "given": "Ipek" } }, { "id": "Yap-Pew-Thian", "name": { "family": "Yap", "given": "Pew-Thian" } }, { "id": "Shen-Dinggang", "name": { "family": "Shen", "given": "Dinggang" } } ] }, "doi": "10.1007/978-3-319-59050-9_52", "resource_type": "book_section", "pub_year": "2017", "author_list": "Dalca, Adrian V.; Bouman, Katherine L.; et al." }, { "id": "https://authors.library.caltech.edu/records/h9qvb-h4m17", "eprint_id": 94522, "eprint_status": "archive", "datestamp": "2023-08-19 00:22:40", "lastmod": "2023-10-20 18:02:14", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Xue-Tianfan", "name": { "family": "Xue", "given": "Tianfan" } }, { "id": "Wu-Jiajun", "name": { "family": "Wu", "given": "Jiajun" }, "orcid": "0000-0002-4176-343X" }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L."
}, "orcid": "0000-0003-0077-4367" }, { "id": "Freeman-W-T", "name": { "family": "Freeman", "given": "William T." }, "orcid": "0000-0002-2231-7995" } ] }, "title": "Visual Dynamics: Probabilistic Future Frame Synthesis via Cross Convolutional Networks", "ispublished": "unpub", "full_text_status": "public", "note": "\u00a9 2016 Neural Information Processing Systems Foundation. \n\nThe authors thank Yining Wang for helpful discussions. This work is supported by NSF Robust Intelligence 1212849, NSF Big Data 1447476, ONR MURI 6923196, Adobe, and Shell Research. The authors would also like to thank Nvidia for GPU donation. \n\nThe first two authors contributed equally to this work.\n\nPublished - 6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks.pdf
Supplemental Material - 6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks-supplemental.zip
", "abstract": "We study the problem of synthesizing a number of likely future frames from a single input image. In contrast to traditional methods, which have tackled this problem in a deterministic or non-parametric way, we propose a novel approach which models future frames in a probabilistic manner. Our proposed method is therefore able to synthesize multiple possible next frames using the same model. Solving this challenging problem involves low- and high-level image and motion understanding for successful image synthesis. Here, we propose a novel network structure, namely a Cross Convolutional Network, that encodes images as feature maps and motion information as convolutional kernels to aid in synthesizing future frames. In experiments, our model performs well on both synthetic data, such as 2D shapes and animated game sprites, as well as on real-world video data. We show that our model can also be applied to tasks such as visual analogy-making, and present analysis of the learned network representations.", "date": "2016-12", "date_type": "published", "publisher": "Neural Information Processing Systems Foundation", "place_of_pub": "La Jolla, CA", "id_number": "CaltechAUTHORS:20190405-161634029", "isbn": "9781510838819", "book_title": "Advances in Neural Information Processing Systems (NIPS 2016)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190405-161634029", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "IIS-1212849" }, { "agency": "Office of Naval Research", "grant_number": "6923196" }, { "agency": "Adobe" }, { "agency": "Shell Research" }, { "agency": "nVidia" } ] }, "contributors": { "items": [ { "id": "Lee-Daniel-D", "name": { "family": "Lee", "given": "Daniel D." 
} }, { "id": "Sugiyama-Masashi", "name": { "family": "Sugiyama", "given": "Masashi" } }, { "id": "von-Luxburg-U", "name": { "family": "von Luxburg", "given": "Ulrike" } }, { "id": "Guyon-I", "name": { "family": "Guyon", "given": "Isabelle" } }, { "id": "Garnett-R", "name": { "family": "Garnett", "given": "Roman" } } ] }, "doi": "10.48550/arXiv.1607.02586", "primary_object": { "basename": "6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks-supplemental.zip", "url": "https://authors.library.caltech.edu/records/h9qvb-h4m17/files/6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks-supplemental.zip" }, "related_objects": [ { "basename": "6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks.pdf", "url": "https://authors.library.caltech.edu/records/h9qvb-h4m17/files/6552-visual-dynamics-probabilistic-future-frame-synthesis-via-cross-convolutional-networks.pdf" } ], "resource_type": "book_section", "pub_year": "2016", "author_list": "Xue, Tianfan; Wu, Jiajun; et al." }, { "id": "https://authors.library.caltech.edu/records/9at3s-nj868", "eprint_id": 94484, "eprint_status": "archive", "datestamp": "2023-08-20 11:59:12", "lastmod": "2023-10-20 18:00:09", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Johnson-M-D", "name": { "family": "Johnson", "given": "Michael D." }, "orcid": "0000-0002-4120-3029" }, { "id": "Zoran-D", "name": { "family": "Zoran", "given": "Daniel" } }, { "id": "Fish-V-L", "name": { "family": "Fish", "given": "Vincent L." }, "orcid": "0000-0002-7128-9345" }, { "id": "Doeleman-S-S", "name": { "family": "Doeleman", "given": "Sheperd S." }, "orcid": "0000-0002-9031-0904" }, { "id": "Freeman-W-T", "name": { "family": "Freeman", "given": "William T." 
}, "orcid": "0000-0002-2231-7995" } ] }, "title": "Computational Imaging for VLBI Image Reconstruction", "ispublished": "unpub", "full_text_status": "public", "note": "\u00a9 2016 IEEE. \n\nWe would like to thank Andrew Chael, Katherine Rosenfeld, and Lindy Blackburn for all of their helpful discussions and feedback. This work was partially supported by NSF CGV-1111415. Katherine Bouman was partially supported by an NSF Graduate Fellowship. We also thank the National Science Foundation (AST-1310896, AST-1211539, and AST-1440254) and the Gordon and Betty Moore Foundation (GBMF-3561) for financial support of this work. This study makes use of 43 GHz VLBA data from the VLBA-BU Blazar Monitoring Program (VLBA-BU-BLAZAR; http://www.bu.edu/blazars/VLBAproject.html), funded by NASA through the Fermi Guest Investigator Program. The VLBA is an instrument of the National Radio Astronomy Observatory. The National Radio Astronomy Observatory is a facility of the National Science Foundation operated by Associated Universities, Inc.\n\nAccepted Version - 1512.01413.pdf
", "abstract": "Very long baseline interferometry (VLBI) is a technique for imaging celestial radio emissions by simultaneously observing a source from telescopes distributed across Earth. The challenges in reconstructing images from fine angular resolution VLBI data are immense. The data is extremely sparse and noisy, thus requiring statistical image models such as those designed in the computer vision community. In this paper we present a novel Bayesian approach for VLBI image reconstruction. While other methods often require careful tuning and parameter selection for different types of data, our method (CHIRP) produces good results under different settings such as low SNR or extended emission. The success of our method is demonstrated on realistic synthetic experiments as well as publicly available real data. We present this problem in a way that is accessible to members of the community, and provide a dataset website (vlbiimaging.csail.mit.edu) that facilitates controlled comparisons across algorithms.", "date": "2016-06", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "913-922", "id_number": "CaltechAUTHORS:20190404-161219475", "isbn": "9781467388511", "book_title": "2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190404-161219475", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "CGV-1111415" }, { "agency": "NSF Graduate Research Fellowship" }, { "agency": "NSF", "grant_number": "AST-1310896" }, { "agency": "NSF", "grant_number": "AST-1211539" }, { "agency": "NSF", "grant_number": "AST-1440254" }, { "agency": "Gordon and Betty Moore Foundation", "grant_number": "GBMF-3561" }, { "agency": "NASA" } ] }, "doi": "10.1109/cvpr.2016.105", "primary_object": { "basename": "1512.01413.pdf", "url": 
"https://authors.library.caltech.edu/records/9at3s-nj868/files/1512.01413.pdf" }, "resource_type": "book_section", "pub_year": "2016", "author_list": "Bouman, Katherine L.; Johnson, Michael D.; et al." }, { "id": "https://authors.library.caltech.edu/records/k2yby-6dy13", "eprint_id": 94523, "eprint_status": "archive", "datestamp": "2023-08-19 22:27:48", "lastmod": "2023-10-20 18:02:17", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Xiao-Bei", "name": { "family": "Xiao", "given": "Bei" } }, { "id": "Battaglia-P", "name": { "family": "Battaglia", "given": "Peter" } }, { "id": "Freeman-W-T", "name": { "family": "Freeman", "given": "William T." }, "orcid": "0000-0002-2231-7995" } ] }, "title": "Estimating the Material Properties of Fabric from Video", "ispublished": "unpub", "full_text_status": "public", "note": "\u00a9 2013 IEEE. \n\nWe would like to thank Lowell ACMTL, particularly Patrick Drane, for their help in collecting data for this project. We would also like to thank Adrian Dalca for all of his helpful discussions and feedback. This work was partially supported by NSF CGV-1111415 and NSF CGV-1212928. Katherine Bouman was partially supported by an NSF Graduate Fellowship. Bei Xiao was supported by an MIT Intelligent Initiative Postdoctoral Fellowship. Peter Battaglia was supported by (IARPA) - D10PC20023.\n\nAccepted Version - Bouman_Estimating_the_Material_2013_ICCV_paper.pdf
", "abstract": "Passively estimating the intrinsic material properties of deformable objects moving in a natural environment is essential for scene understanding. We present a framework to automatically analyze videos of fabrics moving under various unknown wind forces, and recover two key material properties of the fabric: stiffness and area weight. We extend features previously developed to compactly represent static image textures to describe video textures, such as fabric motion. A discriminatively trained regression model is then used to predict the physical properties of fabric from these features. The success of our model is demonstrated on a new, publicly available database of fabric videos with corresponding measured ground truth material properties. We show that our predictions are well correlated with ground truth measurements of stiffness and density for the fabrics. Our contributions include: (a) a database that can be used for training and testing algorithms for passively predicting fabric properties from video, (b) an algorithm for predicting the material properties of fabric from a video, and (c) a perceptual study of humans' ability to estimate the material properties of fabric from videos and images.", "date": "2013-12", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "1984-1991", "id_number": "CaltechAUTHORS:20190405-163101345", "isbn": "9781479928408", "book_title": "2013 IEEE International Conference on Computer Vision", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190405-163101345", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "NSF", "grant_number": "CGV-1111415" }, { "agency": "NSF", "grant_number": "CGV-1212928" }, { "agency": "NSF Graduate Research Fellowship" }, { "agency": "Massachusetts Institute of Technology (MIT)" }, { "agency": "Intelligence Advanced Research Projects 
Activity (IARPA)", "grant_number": "D10PC20023" } ] }, "doi": "10.1109/iccv.2013.455", "primary_object": { "basename": "Bouman_Estimating_the_Material_2013_ICCV_paper.pdf", "url": "https://authors.library.caltech.edu/records/k2yby-6dy13/files/Bouman_Estimating_the_Material_2013_ICCV_paper.pdf" }, "resource_type": "book_section", "pub_year": "2013", "author_list": "Bouman, Katherine L.; Xiao, Bei; et al." }, { "id": "https://authors.library.caltech.edu/records/88fbc-3ex36", "eprint_id": 94485, "eprint_status": "archive", "datestamp": "2023-08-19 13:23:41", "lastmod": "2023-10-20 18:00:18", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Ni-Karl", "name": { "family": "Ni", "given": "Karl" } }, { "id": "Phelps-E", "name": { "family": "Phelps", "given": "Ethan" } }, { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Bliss-N", "name": { "family": "Bliss", "given": "Nadya" } } ] }, "title": "Training image classifiers with similarity metrics, linear programming, and minimal supervision", "ispublished": "unpub", "full_text_status": "restricted", "note": "\u00a9 2012 IEEE. \n\nWe would like to thank Andrew Bolstad at MIT Lincoln Laboratory for all the help, advice, and good ideas he has given us in regard to convex optimization for sparse regularization techniques. This work is sponsored by the Assistant Secretary of Defense for Research & Engineering under Air Force Contract # FA8721-05-C-0002. Opinions, interpretations, conclusions and recommendations are those of the author and are not necessarily endorsed by the United States Government. 
\n\nWe would like to thank Andrew Bolstad at MIT Lincoln Laboratory for all the help, advice, and good ideas he has given us in regard to convex optimization for sparse regularization techniques.", "abstract": "Image classification is a classical computer vision problem with applications to semantic image annotation, querying, and indexing. Recent and effective generative techniques assume Gaussianity, rely on distance metrics, and estimate distributions, but are unfortunately not convex nor keep computational architecture in mind. We propose image content classification through convex linear programming using similarity metrics rather than commonly-used Mahalanobis distances. The algorithm is solved through a hybrid iterative method that takes advantage of optimization space properties. Our optimization problem uses dot products in the feature space exclusively, and therefore can be extended to non-linear kernel functions in the transductive setting.", "date": "2012-11", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "1979-1983", "id_number": "CaltechAUTHORS:20190404-161219565", "isbn": "9781467350518", "book_title": "2012 Conference Record of the Forty Sixth Asilomar Conference on Signals, Systems and Computers (ASILOMAR)", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190404-161219565", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "Air Force Office of Scientific Research (AFOSR)", "grant_number": "FA8721-05-C-0002" } ] }, "doi": "10.1109/acssc.2012.6489386", "resource_type": "book_section", "pub_year": "2012", "author_list": "Ni, Karl; Phelps, Ethan; et al." 
}, { "id": "https://authors.library.caltech.edu/records/br7bc-cr246", "eprint_id": 94526, "eprint_status": "archive", "datestamp": "2023-08-19 05:19:30", "lastmod": "2024-01-14 21:42:07", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine" }, "orcid": "0000-0003-0077-4367" }, { "id": "Ramachandra-V", "name": { "family": "Ramachandra", "given": "Vikas" } }, { "id": "Atanassov-K", "name": { "family": "Atanassov", "given": "Kalin" } }, { "id": "Aleksic-M", "name": { "family": "Aleksic", "given": "Mickey" } }, { "id": "Goma-S-R", "name": { "family": "Goma", "given": "Sergio R." } } ] }, "title": "RAW camera DPCM compression performance analysis", "ispublished": "unpub", "full_text_status": "public", "keywords": "MIPI, DPCM, RAW, compression, MTF", "note": "\u00a9 2011 Society of Photo-Optical Instrumentation Engineers (SPIE).\n\nPublished - 78670N.pdf
", "abstract": "The MIPI standard has adopted DPCM compression for RAW data images streamed from mobile cameras. This DPCM is line based and uses either a simple 1 or 2 pixel predictor. In this paper, we analyze the DPCM compression performance as MTF degradation. To test this scheme's performance, we generated Siemens star images and binarized them to 2-level images. These two intensity values were chosen such that their intensity difference corresponds to those pixel differences which result in largest relative errors in the DPCM compressor. (E.g. a pixel transition from 0 to 4095 corresponds to an error of 6 between the DPCM compressed value and the original pixel value). The DPCM scheme introduces different amounts of error based on the pixel difference. We passed these modified Siemens star chart images to this compressor and compared the compressed images with the original images using IT3 MTF response plots for slanted edges. Further, we discuss the PSF influence on DPCM error and its propagation through the image processing pipe.", "date": "2011-01-24", "date_type": "published", "publisher": "Society of Photo-optical Instrumentation Engineers (SPIE)", "place_of_pub": "Bellingham, WA", "pagerange": "Art. No. 78670N", "id_number": "CaltechAUTHORS:20190405-164254906", "isbn": "9780819484048", "book_title": "Image Quality and System Performance VIII", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190405-164254906", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "contributors": { "items": [ { "id": "Farnand-S-P", "name": { "family": "Farnand", "given": "Susan P." 
} }, { "id": "Gaykema-F", "name": { "family": "Gaykema", "given": "Frans" } } ] }, "doi": "10.1117/12.872637", "primary_object": { "basename": "78670N.pdf", "url": "https://authors.library.caltech.edu/records/br7bc-cr246/files/78670N.pdf" }, "resource_type": "book_section", "pub_year": "2011", "author_list": "Bouman, Katherine; Ramachandra, Vikas; et al." }, { "id": "https://authors.library.caltech.edu/records/qkbw8-03e95", "eprint_id": 94487, "eprint_status": "archive", "datestamp": "2023-08-19 01:53:14", "lastmod": "2023-10-20 18:00:26", "type": "book_section", "metadata_visibility": "show", "creators": { "items": [ { "id": "Bouman-K-L", "name": { "family": "Bouman", "given": "Katherine L." }, "orcid": "0000-0003-0077-4367" }, { "id": "Abdollahian-G", "name": { "family": "Abdollahian", "given": "Golnaz" } }, { "id": "Boutin-M", "name": { "family": "Boutin", "given": "Mireille" } }, { "id": "Delp-E-J", "name": { "family": "Delp", "given": "Edward J." } } ] }, "title": "A low complexity method for detection of text area in natural images", "ispublished": "unpub", "full_text_status": "public", "keywords": "Text Detection, Text Segmentation, Sign Detection, Mobile Devices", "note": "\u00a9 2010 IEEE. \n\nThis work was sponsored by Next Wave Systems, LLC.\n\nPublished - 05495331.pdf
", "abstract": "We propose a low complexity method for segmentation of text regions in natural images. This algorithm is designed for mobile applications (e.g. unmanned or hand-held devices) in which computational and energy resources are limited. No prior assumption is made regarding the text size, font, language, character set or the camera angle. However, the text is assumed to be located on a piecewise homogeneous background with a contrasting color. We have deployed our method on a Nokia N800 Internet tablet as part of a system for automatic detection and translation of outdoor signs. Our experiments show that the 0.3 megapixel images taken by the phone camera can be accurately segmented within the device in a fraction of a second.", "date": "2010-03", "date_type": "published", "publisher": "IEEE", "place_of_pub": "Piscataway, NJ", "pagerange": "1050-1053", "id_number": "CaltechAUTHORS:20190404-161219749", "isbn": "9781424442959", "book_title": "2010 IEEE International Conference on Acoustics, Speech and Signal Processing", "official_url": "https://resolver.caltech.edu/CaltechAUTHORS:20190404-161219749", "rights": "No commercial reproduction, distribution, display or performance rights in this work are provided.", "funders": { "items": [ { "agency": "Next Wave Systems" } ] }, "doi": "10.1109/icassp.2010.5495331", "primary_object": { "basename": "05495331.pdf", "url": "https://authors.library.caltech.edu/records/qkbw8-03e95/files/05495331.pdf" }, "resource_type": "book_section", "pub_year": "2010", "author_list": "Bouman, Katherine L.; Abdollahian, Golnaz; et al." } ]