% Conference paper (ESWC 2012 per the note field; proceedings dated 2015).
% The citation key is kept exactly as exported so existing \cite commands keep resolving.
% Names use the "Last, First" form so multi-word surnames (e.g. Della Valle) parse correctly.
% NOTE(review): the LNCS volume number is not present in the export -- add a volume field once confirmed.
@inproceedings{5d19064ec9d34bf8b4aa7c0df787d95a,
  author    = {Omitola, Tope and Freitas, Andr{\'e} and Curry, Edward and O'Riain, S{\'e}an and Gibbins, Nicholas and Shadbolt, Nigel},
  title     = {Capturing interactive data transformation operations using provenance workflows},
  editor    = {Passant, Alexandre and Norton, Barry and Della Valle, Emanuele and Troncy, Raphael and Fundulaki, Irini and Simperl, Elena and Mladenic, Dunja},
  booktitle = {The Semantic Web},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer-Verlag},
  year      = {2015},
  pages     = {29--42},
  isbn      = {9783662466407},
  doi       = {10.1007/978-3-662-46641-4_3},
  language  = {English},
  keywords  = {Data consumption, Data publication, Extract-Transform-Load, Interactive data transformation, Linked Data, Provenance, Public open data, Semantic Web, Workflow},
  abstract  = {The ready availability of data is leading to the increased opportunity of their re-use for new applications and for analyses. Most of these data are not necessarily in the format users want, are usually heterogeneous, and highly dynamic, and this necessitates data transformation efforts to re-purpose them. Interactive data transformation (IDT) tools are becoming easily available to lower these barriers to data transformation efforts. This paper describes a principled way to capture data lineage of interactive data transformation processes. We provide a formal model of IDT, its mapping to a provenance representation, and its implementation and validation on Google Refine. Provision of the data transformation process sequences allows assessment of data quality and ensures portability between IDT and other data transformation platforms. The proposed model showed a high level of coverage against a set of requirements used for evaluating systems that provide provenance management solutions.},
  note      = {Publisher Copyright: {\textcopyright} Springer-Verlag Berlin Heidelberg 2015. Extended Semantic Web Conference, ESWC 2012; Conference date: 27-05-2012 through 31-05-2012},
}