{"corpus_id":1850394,"paper_sha":"55554a329bff32907ab384358be08d0ac753f416","doi":"10.1109/CVPRW.2016.8","arxiv_id":"1605.01923","pmid":null,"pmcid":null,"mag_id":2963070315,"dblp_id":"conf/cvpr/MostegelRFB16a","acl_id":null,"title":"UAV-Based Autonomous Image Acquisition with Multi-view Stereo Quality Assurance by Confidence Prediction","year":2016,"publication_date":"2016-05-06","venue":"2016 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","journal":{"name":"2016 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","pages":"1-10","volume":null},"journal_issn":null,"journal_title":null,"publication_types":["JournalArticle","Conference"],"pubmed_pub_types":null,"s2_fields_of_study":["Computer Science","Engineering"],"reference_count":54,"citation_count":43,"influential_citation_count":2,"is_open_access":true,"arxiv_categories":["cs.CV","cs.RO"],"arxiv_license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","arxiv_journal_ref":null,"mesh_headings":null,"chemicals":null,"comments_corrections":null,"source_flags":1,"s2_open_access_pdf_url":"https://arxiv.org/pdf/1605.01923","s2_open_access_landing_url":"https://www.semanticscholar.org/paper/55554a329bff32907ab384358be08d0ac753f416","s2_open_access_license":null,"s2_open_access_status":"GREEN","pmc_open_access_pdf_url":null,"pmc_open_access_landing_url":null,"pmc_open_access_license":null,"pmc_open_access_status":null,"unpaywall_open_access_pdf_url":null,"unpaywall_open_access_landing_url":null,"unpaywall_open_access_license":null,"unpaywall_open_access_status":null,"abstract":"In this paper we present an autonomous system for acquiring close-range high-resolution images that maximize the quality of a later-on 3D reconstruction with respect to coverage, ground resolution and 3D uncertainty. In contrast to previous work, our system uses the already acquired images to predict the confidence in the output of a dense multi-view stereo approach without executing it. This confidence encodes the likelihood of a successful reconstruction with respect to the observed scene and potential camera constellations. Our prediction module runs in real-time and can be trained without any externally recorded ground truth. We use the confidence prediction for on-site quality assurance and for planning further views that are tailored for a specific multi-view stereo approach with respect to the given scene. We demonstrate the capabilities of our approach with an autonomous Unmanned Aerial Vehicle (UAV) in a challenging outdoor scenario.","claims":[{"public_id":"cl_e685ce9a47221f069561311daa1125dd","status":"active","text":"An autonomous image acquisition system maximizes the quality of 3D reconstruction with respect to coverage, ground resolution, and 3D uncertainty by acquiring close-range high-resolution images.","confidence":0.85,"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/claims/cl_e685ce9a47221f069561311daa1125dd"},{"public_id":"cl_678b782eb7ff06fe2bf77bc9fd3db5c5","status":"active","text":"Confidence in the output of a dense multi-view stereo approach is predicted directly from already-acquired images without executing the multi-view stereo reconstruction, in contrast to previous approaches.","confidence":0.9,"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/claims/cl_678b782eb7ff06fe2bf77bc9fd3db5c5"},{"public_id":"cl_416fc25d7b7a3c55d4928fa3e07d9430","status":"active","text":"Confidence prediction is used for on-site quality assurance and for planning further views tailored to a specific multi-view stereo approach and scene.","confidence":0.8,"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/claims/cl_416fc25d7b7a3c55d4928fa3e07d9430"},{"public_id":"cl_915e5d931a1443498ea08e6601b5e358","status":"active","text":"The confidence prediction module runs in real time and can be trained without any externally recorded ground truth.","confidence":0.85,"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/claims/cl_915e5d931a1443498ea08e6601b5e358"},{"public_id":"cl_8d2fe49ca95f4174362f5a0b5481cdba","status":"active","text":"The system's capabilities are demonstrated using an autonomous Unmanned Aerial Vehicle in a challenging outdoor scenario.","confidence":0.75,"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/claims/cl_8d2fe49ca95f4174362f5a0b5481cdba"}],"concepts":[{"public_id":"co_014105891de1fb4598ea1be5aeca46ed","status":"active","name":"autonomous image acquisition system","description":"An onboard system that autonomously captures close-range high-resolution images during UAV operation for later 3D reconstruction.","types":["system"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_014105891de1fb4598ea1be5aeca46ed"},{"public_id":"co_107cb2d583fc4245079bc358be0e4c05","status":"active","name":"camera constellations","description":"Spatial arrangements of camera viewpoints considered when predicting reconstruction confidence.","types":["concept"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_107cb2d583fc4245079bc358be0e4c05"},{"public_id":"co_24423748581a47ee6b2ffff09af41331","status":"active","name":"ground truth","description":"Externally recorded reference data that can be used to train or validate prediction models.","types":["data"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_24423748581a47ee6b2ffff09af41331"},{"public_id":"co_253e267b55434cc4791288e97782da4e","status":"active","name":"ground resolution","description":"A measure of the spatial detail captured per pixel relative to the ground in acquired images.","types":["metric"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_253e267b55434cc4791288e97782da4e"},{"public_id":"co_2fa336527b6d1d4a3866aaa3892901b6","status":"active","name":"3D reconstruction","description":"The process of building a three-dimensional model of a scene from acquired images.","types":["task"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_2fa336527b6d1d4a3866aaa3892901b6"},{"public_id":"co_2fc21f075c378b84c282f755b35d3eae","status":"active","name":"Unmanned Aerial Vehicle","description":"An autonomous flying platform used to acquire images of the scene from the air.","types":["platform"],"aliases":["UAV"],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_2fc21f075c378b84c282f755b35d3eae"},{"public_id":"co_31a276ac1d7eacec13cf24c0e9844af0","status":"active","name":"on-site quality assurance","description":"Real-time assessment of acquisition or reconstruction quality performed during data collection in the field.","types":["process"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_31a276ac1d7eacec13cf24c0e9844af0"},{"public_id":"co_458c81392291f3407f1a258f90aa7b16","status":"active","name":"coverage","description":"A measure of how completely the scene is captured by the set of acquired images.","types":["metric"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_458c81392291f3407f1a258f90aa7b16"},{"public_id":"co_57ef5de187a98e69db7c861be5a3ee94","status":"active","name":"confidence prediction","description":"A module that estimates the likelihood of a successful multi-view stereo reconstruction directly from acquired images, without running the reconstruction.","types":["method"],"aliases":["prediction module"],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_57ef5de187a98e69db7c861be5a3ee94"},{"public_id":"co_a05d50d748fdadcc2e955d42aec3a5da","status":"active","name":"3D uncertainty","description":"A measure of the uncertainty associated with the reconstructed 3D geometry.","types":["metric"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_a05d50d748fdadcc2e955d42aec3a5da"},{"public_id":"co_a097c80802422d3e2316b906285b50b5","status":"active","name":"dense multi-view stereo","description":"A dense reconstruction approach that estimates 3D scene geometry from multiple overlapping images.","types":["method"],"aliases":["multi-view stereo approach"],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_a097c80802422d3e2316b906285b50b5"},{"public_id":"co_f51a22cbdc086f0da53848f10eee4cbe","status":"active","name":"view planning","description":"The task of selecting further camera viewpoints to improve scene coverage and reconstruction quality.","types":["task"],"aliases":[],"contributors":[{"id":17,"public_id":"322360f1c1","public_label":"Killer Whale (322360f1c1)","roles":["extraction"],"url":"https://sah.borca.ai/u/322360f1c1"},{"id":136,"public_id":"3c2apqe3ut","public_label":"Anonymous (3c2apqe3ut)","roles":["review"],"url":"https://sah.borca.ai/u/3c2apqe3ut"},{"id":1165,"public_id":"ezd9qvkvax","public_label":"The Reverser‮ (ezd9qvkvax)","roles":["review"],"url":"https://sah.borca.ai/u/ezd9qvkvax"}],"url":"https://sah.borca.ai/concepts/co_f51a22cbdc086f0da53848f10eee4cbe"}],"external_ids":{"DOI":"10.1109/CVPRW.2016.8","ArXiv":"1605.01923","PubMed":null,"PubMedCentral":null,"MAG":2963070315,"DBLP":"conf/cvpr/MostegelRFB16a","ACL":null},"open_access":{"is_open_access":true,"pdf_url":"https://arxiv.org/pdf/1605.01923","landing_url":"https://www.semanticscholar.org/paper/55554a329bff32907ab384358be08d0ac753f416","source":"semantic_scholar","pdf_url_source":"semantic_scholar_open_access_pdf","license":null,"status":"GREEN","reason":null},"reference_availability":{"status":"available","references_indexed":true,"full_text_available":true,"full_text_source":"arxiv","count_basis":"semantic_scholar_metadata","extraction_status":"not_applicable","reason":null},"source":{"provider":"episteme2","base_corpus":"semantic_scholar_dump","freshness_mode":"unknown","basis":["semantic_scholar_metadata","postgres_metadata"],"limits":["paper metadata is based on indexed upstream scholarly datasets","claims and concepts are available only for extracted papers","absence of claims or concepts means no extracted graph data is available in this response"],"status":"available","degraded":false,"degraded_reasons":[],"diagnostics":{"status":"available","degraded":false,"degraded_reasons":[],"metadata_status":"available","graph_status":"available","abstract_status":"available"},"source_flags":1},"paper_id":631002,"paper_uid":"7a9a718d-48b0-49a2-b4fc-a0fe602cc25a","canonical_identity":{"paper_id":631002,"paper_uid":"7a9a718d-48b0-49a2-b4fc-a0fe602cc25a","identity_status":"available","lookup_basis":"semantic_scholar_external_id","compatibility_path":"corpus_id"},"url":"https://sah.borca.ai/papers/1850394"}