% Conference paper (SAICSIT 2010) on a data lineage model for sub-image processing.
% The citation key is kept unchanged so existing citations of this entry keep resolving.
% NOTE(review): the third author's surname may be misspelled in the export
% (possibly "Boxhoorn") -- confirm against the publisher record before changing it.
@inproceedings{2d0e27fc5bd14cd58e1e81888ab6ef3a,
  author    = {Mwebaze, Johnson and McFarland, John and Booxhorn, Danny and Valentijn, Edwin},
  title     = {A data lineage model for distributed sub-image processing},
  booktitle = {Fountains of Computing Research - Proceedings of {SAICSIT} 2010 Annual Research Conference of the South African Institute of Computer Scientists and Information Technologists},
  series    = {{ACM} International Conference Proceeding Series},
  publisher = {ACM Press Digital Library},
  year      = {2010},
  pages     = {209--219},
  doi       = {10.1145/1899503.1899527},
  isbn      = {9781605589503},
  language  = {English},
  keywords  = {data lineage, data reduction, provenance, scientific computing, subimage processing, target processing},
  abstract  = {An important challenge facing e-Science is the development of scalable systems and analysis techniques that allow client applications to locate data and services in increasingly large-scale distributed environments. e-Science Systems should achieve three main goals: (i) efficient and selective processing of data, (ii) support network collaboration without clogging distribution networks; and (iii) allow transparency of experiments through repeatability and verifiability of experiments. Several systems have addressed limited combinations of these properties, but we address all three in this work. We describe the architecture and implementation of such a framework in Astro-WISE, an astronomical approach to distributed data processing, discovery and retrieval of datasets that achieves scalability via dynamic linking (data lineage) maintained within the system. We show that lineage data collected during the processing and analysis of datasets can be reused to perform selective reprocessing (at sub-image level) on datasets while the remainder of the dataset is untouched, a rather difficult process to automate without lineage.},
  note      = {2010 Annual Research Conference of the South African Institute of Computer Scientists and Information Technologists, SAICSIT 2010 ; Conference date: 11-10-2010 Through 13-10-2010},
}