% Stream2Graph conference paper (IEEE Big Data 2022), cleaned up from a repository auto-export.
% Compound surnames (El Jaouhari, El Ouafi, Van den Poel) are wrapped in real brace groups so
% they are parsed as one indivisible last name; the export had escaped braces, which print literally.
% The month follows the conference date given in the note field (17-20 December 2022); the export's
% 1 January placeholder was dropped. The series field was removed because it duplicated booktitle.
@inproceedings{ea10e2e862044786a443e28b8f9abf65,
  author    = {Mariam Barry and Albert Bifet and Raja Chiky and {El Jaouhari}, Saad and Jacob Montiel and {El Ouafi}, Aissa and Dhiaddedine Yousfi and Eric Guerizec and Aurel Nobial},
  title     = {{Stream2Graph}: Dynamic Knowledge Graph for Online Learning Applied in Large-scale Network},
  booktitle = {Proceedings - 2022 {IEEE} International Conference on Big Data, Big Data 2022},
  editor    = {Shusaku Tsumoto and Yukio Ohsawa and Lei Chen and {Van den Poel}, Dirk and Xiaohua Hu and Yoichi Motomura and Takuya Takagi and Lingfei Wu and Ying Xie and Akihiro Abe and Vijay Raghavan},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  pages     = {2190--2197},
  year      = {2022},
  month     = dec,
  doi       = {10.1109/BigData55660.2022.10020885},
  language  = {English},
  keywords  = {Banking, Big data, Knowledge Graph, Online Machine Learning, Real-Time, Streaming, Telecommunication},
  abstract  = {Knowledge Graphs (KG) are valuable information sources that store knowledge in a domain (healthcare, finance, e-commerce, cyber-security.). Most industrial KGs are dynamic by nature as they are updated regularly with streaming data (customer activity, network traffic, application logs, IT process). However, extracting insights from continuously updated data comes with major challenges, particularly in big data settings. In this paper, we address the following challenges: 1) ingesting heterogeneous data, 2) training and deployment of predictive models on continuously evolving data, and 3) implementation of data pipelines for updating and maintaining the KG in production. We cover multiple aspects of this process, from knowledge collection to its operationalization. We propose Stream2Graph, a stream-based system for building and updating the knowledge base dynamically in real time. Then we show how graph features can be used in downstream online machine learning models. The solution speeds up big data stream learning and knowledge extraction to enhance Graph-based AI applications. Experimental results show the effectiveness of our solution for knowledge base construction and improvement of big data learning capabilities. Using data from Stream2Graph resulted in speedups for training and inference time in the range from 547x to 2000x in downstream ML models. Finally, we provide the lessons learned from applying graph-based online learning on large-scale network processing high-velocity streaming data.},
  note      = {Publisher Copyright: {\textcopyright} 2022 IEEE.; 2022 IEEE International Conference on Big Data, Big Data 2022 ; Conference date: 17-12-2022 Through 20-12-2022},
}