@article{Kumar Mondal-2021-Large,
title = "Large Scale Image Registration Utilizing Data-Tunneling in the MapReduce Cluster",
author = "Mondal, Amit Kumar and
Roy, Banani and
Roy, Chanchal K. and
Schneider, Kevin A.",
journal = "Lecture Notes on Data Engineering and Communications Technologies",
year = "2021",
publisher = "Springer Singapore",
url = "https://gwf-uwaterloo.github.io/gwf-publications/G21-27001",
doi = "10.1007/978-981-16-6636-0_14",
pages = "167--180",
abstract = "Applications of image registration tasks are computation-intensive, memory-intensive, and communication-intensive. Robust efforts are required on error recovery and re-usability of both the data and the operations, along with performance optimization. Considering these, we explore various programming models aiming to minimize the folding operations (such as join and reduce) which are the primary candidates of data shuffling, concurrency bugs and expensive communication in a distributed cluster. Particularly, we analyze modular MapReduce execution of an image registration pipeline (IRP) with the external and internal data (data-tunneling) flow mechanism and compare them with the compact model. Experimental analyzes with the ComputeCanada cluster and a crop field data-sets containing 1000 images show that these design options are valuable for large-scale IRPs executed with a MapReduce cluster. Additionally, we present an effectiveness measurement metric to analyze the impact of a design model for the Big IRP, accumulating the error-recovery and re-usability metrics along with the data size and execution time. Our explored design models and their performance analysis can serve as a benchmark for the researchers and application developers who deploy large-scale image registration and other image processing tasks.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="KumarMondal-2021-Large">
<titleInfo>
<title>Large Scale Image Registration Utilizing Data-Tunneling in the MapReduce Cluster</title>
</titleInfo>
<name type="personal">
<namePart type="given">Amit</namePart>
<namePart type="given">Kumar</namePart>
<namePart type="family">Mondal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Banani</namePart>
<namePart type="family">Roy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chanchal</namePart>
<namePart type="given">K</namePart>
<namePart type="family">Roy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Kevin</namePart>
<namePart type="given">A</namePart>
<namePart type="family">Schneider</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2021</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>Lecture Notes on Data Engineering and Communications Technologies</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>Springer Singapore</publisher>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>Applications of image registration tasks are computation-intensive, memory-intensive, and communication-intensive. Robust efforts are required on error recovery and re-usability of both the data and the operations, along with performance optimization. Considering these, we explore various programming models aiming to minimize the folding operations (such as join and reduce) which are the primary candidates of data shuffling, concurrency bugs and expensive communication in a distributed cluster. Particularly, we analyze modular MapReduce execution of an image registration pipeline (IRP) with the external and internal data (data-tunneling) flow mechanism and compare them with the compact model. Experimental analyzes with the ComputeCanada cluster and a crop field data-sets containing 1000 images show that these design options are valuable for large-scale IRPs executed with a MapReduce cluster. Additionally, we present an effectiveness measurement metric to analyze the impact of a design model for the Big IRP, accumulating the error-recovery and re-usability metrics along with the data size and execution time. Our explored design models and their performance analysis can serve as a benchmark for the researchers and application developers who deploy large-scale image registration and other image processing tasks.</abstract>
<identifier type="citekey">Kumar Mondal-2021-Large</identifier>
<identifier type="doi">10.1007/978-981-16-6636-0_14</identifier>
<location>
<url>https://gwf-uwaterloo.github.io/gwf-publications/G21-27001</url>
</location>
<part>
<date>2021</date>
<extent unit="page">
<start>167</start>
<end>180</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T Large Scale Image Registration Utilizing Data-Tunneling in the MapReduce Cluster
%A Mondal, Amit Kumar
%A Roy, Banani
%A Roy, Chanchal K.
%A Schneider, Kevin A.
%J Lecture Notes on Data Engineering and Communications Technologies
%D 2021
%I Springer Singapore
%F KumarMondal-2021-Large
%X Applications of image registration tasks are computation-intensive, memory-intensive, and communication-intensive. Robust efforts are required on error recovery and re-usability of both the data and the operations, along with performance optimization. Considering these, we explore various programming models aiming to minimize the folding operations (such as join and reduce) which are the primary candidates of data shuffling, concurrency bugs and expensive communication in a distributed cluster. Particularly, we analyze modular MapReduce execution of an image registration pipeline (IRP) with the external and internal data (data-tunneling) flow mechanism and compare them with the compact model. Experimental analyzes with the ComputeCanada cluster and a crop field data-sets containing 1000 images show that these design options are valuable for large-scale IRPs executed with a MapReduce cluster. Additionally, we present an effectiveness measurement metric to analyze the impact of a design model for the Big IRP, accumulating the error-recovery and re-usability metrics along with the data size and execution time. Our explored design models and their performance analysis can serve as a benchmark for the researchers and application developers who deploy large-scale image registration and other image processing tasks.
%R 10.1007/978-981-16-6636-0_14
%U https://gwf-uwaterloo.github.io/gwf-publications/G21-27001
%U https://doi.org/10.1007/978-981-16-6636-0_14
%P 167-180
Markdown (Informal)
[Large Scale Image Registration Utilizing Data-Tunneling in the MapReduce Cluster](https://gwf-uwaterloo.github.io/gwf-publications/G21-27001) (Mondal et al., GWF 2021)
ACL
- Amit Kumar Mondal, Banani Roy, Chanchal K. Roy, and Kevin A. Schneider. 2021. Large Scale Image Registration Utilizing Data-Tunneling in the MapReduce Cluster. Lecture Notes on Data Engineering and Communications Technologies:167–180.