% Conference paper in the CSCI 2021 proceedings. The citation key is kept
% verbatim so that existing \cite commands keep resolving.
% Conference dates and the copyright line live in eventdate / copyright so
% that classic styles do not print them as a trailing note.
% NOTE(review): surname casing normalised from the export's "MacHowski" --
% confirm against the published paper.
@inproceedings{0073b6aba4cb4bbca7ded988b38c21e3,
  author    = {Machowski, Lukasz and Marwala, Tshilidzi},
  title     = {Preservation of Manual Changes and Provenance for Data Quality using the {Nano Version Control} Repo},
  booktitle = {Proceedings - 2021 International Conference on Computational Science and Computational Intelligence, {CSCI} 2021},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2021},
  pages     = {1905--1911},
  doi       = {10.1109/CSCI54926.2021.00356},
  eventdate = {2021-12-15/2021-12-17},
  copyright = {{\textcopyright} 2021 IEEE},
  language  = {English},
  keywords  = {data quality, data-lineage, provenance},
  abstract  = {A new data structure called the Nano Version Control (NanoVC) repo emerges from computer science and the software industry. This data structure efficiently encodes entities at the nano-scale of the modelling spectrum and stores the provenance for that entity. The repo provides an intuitive representation of the history and data-lineage of the entity. Some provenance information can be computed on demand because of the repo structure. A simple algorithm for preservation of manual changes in the light of new data and changing algorithms utilizes the commit history in the repo to give us a sustainable way to merge information while keeping the provenance intact.},
}