% Conference paper in the UEMCON 2019 proceedings (IEEE), pages 112--118.
% Names are stored in "Last, First" form; case-sensitive words in title and
% booktitle are brace-protected so sentence-casing styles keep them intact.
@inproceedings{3f3a1aa7dae04494a4f592378507bd92,
  author    = {Chandra, Shireesha and Varde, Aparna S. and Wang, Jiayin},
  title     = {A {Hive} and {SQL} Case Study in Cloud Data Analytics},
  editor    = {Chakrabarti, Satyajit and Saha, Himadri Nath},
  booktitle = {2019 {IEEE} 10th Annual Ubiquitous Computing, Electronics and Mobile Communication Conference, {UEMCON} 2019},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  pages     = {112--118},
  year      = {2019},
  month     = oct,
  doi       = {10.1109/UEMCON47517.2019.8992925},
  language  = {English},
  keywords  = {Big Data, Cloud Computing, Hadoop and Hive, Performance Comparisons, RDBMS and SQL},
  abstract  = {The digital universe is expanding at a very fast pace generating massive datasets. In order to keep up with the processing and storage needs for this big data, and to discover knowledge, we need scalable infrastructure and technologies that can access data from multiple disks simultaneously. Cloud computing provides paradigms for data analytics over such huge datasets. While SQL continues to be popular among database and data mining professionals, in recent years Hive has established itself as a rapidly advancing technology for big data which makes it highly suitable for use over the cloud. In this paper, we present investigatory research on Hive and SQL with a detailed case study between them, considering cloud data management and mining. Our work here constitutes a thorough scrutiny, focusing on processing Hive queries on cloud infrastructure considering three different approaches, and also delving into SQL processing on the cloud with similar approaches. Real datasets are used for conducting various operations using Hive and SQL. This paper conducts performance comparisons of the two technologies and explains the environment in which one is preferred over the other for processing and analyzing data. It provides recommendations for cloud data analytics, based on the case study.},
  note      = {10th IEEE Annual Ubiquitous Computing, Electronics and Mobile Communication Conference, UEMCON 2019 ; Conference date: 10-10-2019 Through 12-10-2019},
}