The Internet of Things is applied in many domains and collects vast amounts of data. This data provides access to a lot of knowledge when analyzed comprehensively. However, advanced analysis techniques such as predictive or prescriptive analytics require access to both, history data, i.e., long-term persisted data, and real-time data as well as a joint view on both types of data. State-of-the-art hybrid processing architectures for big data—namely, the Lambda and the Kappa Architecture—support the processing of history data and real-time data. However, they lack of a tight coupling of the two processing modes. That is, the user has to do a lot of work manually in order to enable a comprehensive analysis of the data. For instance, the user has to combine the results of both processing modes or apply knowledge from one processing mode to the other. Therefore, we introduce a novel hybrid processing architecture for big data, called BRAID. BRAID intertwines the processing of history data and real-time data by adding communication channels between the batch engine and the stream engine. This enables to carry out comprehensive analyses automatically at a reasonable overhead.
%0 Conference Paper
%1 data_18_braid
%A Giebler, Corinna
%A Stach, Christoph
%A Schwarz, Holger
%A Mitschang, Bernhard
%B Proceedings of the 7ᵗʰ International Conference on Data Science, Technology and Applications
%C Porto
%D 2018
%E Bernardino, Jorge
%E Quix, Christoph
%I SciTePress
%K Big_Data IoT Kappa_Architecture Lambda_Architecture batch_processing stream_processing
%P 294–301
%R 10.5220/0006861802940301
%T BRAID — A Hybrid Processing Architecture for Big Data
%V 1
%X The Internet of Things is applied in many domains and collects vast amounts of data. This data provides access to a lot of knowledge when analyzed comprehensively. However, advanced analysis techniques such as predictive or prescriptive analytics require access to both, history data, i.e., long-term persisted data, and real-time data as well as a joint view on both types of data. State-of-the-art hybrid processing architectures for big data—namely, the Lambda and the Kappa Architecture—support the processing of history data and real-time data. However, they lack of a tight coupling of the two processing modes. That is, the user has to do a lot of work manually in order to enable a comprehensive analysis of the data. For instance, the user has to combine the results of both processing modes or apply knowledge from one processing mode to the other. Therefore, we introduce a novel hybrid processing architecture for big data, called BRAID. BRAID intertwines the processing of history data and real-time data by adding communication channels between the batch engine and the stream engine. This enables to carry out comprehensive analyses automatically at a reasonable overhead.
%@ 978-989-758-318-6
@inproceedings{data_18_braid,
abstract = {The Internet of Things is applied in many domains and collects vast amounts of data. This data provides access to a lot of knowledge when analyzed comprehensively. However, advanced analysis techniques such as predictive or prescriptive analytics require access to both, history data, i.e., long-term persisted data, and real-time data as well as a joint view on both types of data. State-of-the-art hybrid processing architectures for big data—namely, the Lambda and the Kappa Architecture—support the processing of history data and real-time data. However, they lack of a tight coupling of the two processing modes. That is, the user has to do a lot of work manually in order to enable a comprehensive analysis of the data. For instance, the user has to combine the results of both processing modes or apply knowledge from one processing mode to the other. Therefore, we introduce a novel hybrid processing architecture for big data, called BRAID. BRAID intertwines the processing of history data and real-time data by adding communication channels between the batch engine and the stream engine. This enables to carry out comprehensive analyses automatically at a reasonable overhead.},
added-at = {2020-09-21T11:45:55.000+0200},
address = {Porto},
author = {Giebler, Corinna and Stach, Christoph and Schwarz, Holger and Mitschang, Bernhard},
biburl = {https://puma.ub.uni-stuttgart.de/bibtex/2de82d963740455021ba76df683c81e3e/christophstach},
booktitle = {Proceedings of the 7ᵗʰ International Conference on Data Science, Technology and Applications},
doi = {10.5220/0006861802940301},
editor = {Bernardino, Jorge and Quix, Christoph},
interhash = {ffd044502fcab972628a4cbc95b855f7},
intrahash = {de82d963740455021ba76df683c81e3e},
isbn = {978-989-758-318-6},
keywords = {Big_Data IoT Kappa_Architecture Lambda_Architecture batch_processing stream_processing},
month = jun,
pages = {294–301},
publisher = {SciTePress},
series = {DATA '18},
timestamp = {2020-09-21T09:45:55.000+0200},
title = {BRAID — A Hybrid Processing Architecture for Big Data},
volume = 1,
year = 2018
}