@inproceedings{bc46ed4d1a7c4b8cabaab3c30cc72a0a,
title = "HyPerInsight: Data exploration deep inside hyper",
abstract = "Nowadays we are drowning in data of various varieties. For all these mixed types and categories of data there exist even more different analysis approaches, often done in single hand-written solutions. We propose to extend HyPer, a main memory database system to a uniform data agent platform following the {"}one system fits all{"} approach for solving a wide variety of data analysis problems. We achieve this by applying a flexible operator concept to a set of various important data exploration algorithms. With that, HyPer solves analytical questions using clustering, classification, association rule mining and graph mining besides standard HTAP (Hybrid Transaction and Analytical Processing) workloads on the same database state. It enables to approach the full variety and volume of HTAP extended for data exploration (HTAPx), and only needs knowledge of already introduced SQL extensions that are automatically optimized by the database's standard optimizer. In this demo we will focus on the benefits and flexibility we create by using the SQL extensions for several well-known mining workloads. In our interactive webinterface for this project named HyPerInsight we demonstrate how HyPer outperforms the best open source competitor Apache Spark in common use cases in social media, geo-data, recommender systems and several other.",
keywords = "Apriori, DBscan, Database operators, Hyper, Query processing, SQL, k-Means",
author = "Nina Hubig and Linnea Passing and Sch{\"u}le, {Maximilian E.} and Dimitri Vorona and Alfons Kemper and Thomas Neumann",
note = "Publisher Copyright: {\textcopyright} 2017 Association for Computing Machinery.; 26th ACM International Conference on Information and Knowledge Management, CIKM 2017 ; Conference date: 06-11-2017 Through 10-11-2017",
year = "2017",
month = nov,
day = "6",
doi = "10.1145/3132847.3133167",
language = "English",
series = "International Conference on Information and Knowledge Management, Proceedings",
publisher = "Association for Computing Machinery",
pages = "2467--2470",
booktitle = "CIKM 2017 - Proceedings of the 2017 ACM Conference on Information and Knowledge Management",
}