% Conference paper in the proceedings of the Twelfth Australasian Data Mining
% Conference (AusDM14), issued as volume 158 of the "Conferences in Research
% and Practice in Information Technology Series".
% NOTE(review): `address` holds only a country; BibTeX expects the publisher's
% city here -- TODO confirm the city and update.
@inproceedings{9dbb62ad3a3e4facbf2fa70884c099f4,
  author    = {Brittliff, Neil and Sharma, Dharmendra},
  title     = {The schema last approach to data fusion},
  booktitle = {Twelfth Australasian Data Mining Conference ({AusDM14})},
  editor    = {Li, Xue and Liu, Lin and Ong, Kok-Leong and Zhao, Yanchang},
  series    = {Conferences in Research and Practice in Information Technology Series},
  volume    = {158},
  pages     = {51--58},
  publisher = {Australian Computer Society},
  address   = {Australia},
  year      = {2014},
  isbn      = {9781921770173},
  language  = {English},
  keywords  = {Data fusion},
  abstract  = {Big Data presents new challenges that require new and novel approaches in order to resolve the problems associated with the variability and variety of data obtained from multiple sources. This paper focuses on how to manage variety and the eclectic nature of big data using a technique known as 'Schema Last'. The 'Schema Last' approach is a framework which defers the application of a descriptive model until it is required. This paper also provides a formal definition of the 'Schema Last' methodology and demonstrates the effectiveness over the more traditional Extract-Transform-Load methodologies employed in many organizations. The 'Schema Last' approach can be used as input to Map Reduction, Index creation and various data mining techniques. Ultimately, the Schema Last approach provides the framework to 'fuse' semistructured data into a single coherent view.},
}