Hive-Class/hive-class-2.txt at main · SkF-Python1/Hive-Class

105 lines (77 loc) · 8.18 KB
-- Create the class database only when it is absent, so re-running these
-- notes does not fail because the database already exists; then make it
-- the current database for every statement that follows.
create database if not exists hive_class_b1;
use hive_class_b1;
    > fields terminated by ','; 
-- Show the columns of department_data.
describe department_data;
-- Same table, using the FORMATTED option for the more detailed listing.
describe formatted department_data;
-- Load the department CSV from the local filesystem (LOCAL keyword plus a
-- file:// URI) into department_data. There is no OVERWRITE keyword, so the
-- file is added to whatever the table already holds.
load data local inpath 'file:///tmp/hive_class/depart_data.csv' into table department_data;
-- Display column names as a header row above query results.
set hive.cli.print.header = true;
-- Load every file under an HDFS directory into department_data_from_hdfs.
-- NOTE(review): without LOCAL, Hive is documented to move (not copy) the
-- source files into the table's storage location, so /tmp/hive_data_class_2/
-- may be empty afterwards. The external table created further down points at
-- that same directory; confirm the data is still there before querying it.
load data inpath '/tmp/hive_data_class_2/' into table department_data_from_hdfs;
-- Create an external table
create external table department_data_external                                                                                          
    > location '/tmp/hive_data_class_2/'; 
-- Work with array data types
    > collection items terminated by ':';                                                                                                     
-- Load the array sample file from the local filesystem into employee.
load data local
    inpath 'file:///tmp/hive_class/array_data.csv'
    into table employee;
-- Read an element of a Hive array column by index: skills[0] is exposed
-- as prime_skill alongside each employee's id and name.
select
    id,
    name,
    skills[0] as prime_skill
from employee;
    > size(skills) as size_of_each_array,                                                                                                     
    > array_contains(skills,"HADOOP") as knows_hadoop,                                                                                        
    > sort_array(skills) as sorted_array                                                                                                                     
    > from employee; 
-- Table for map data
create table employee_map_data                                                                                                          
    > collection items terminated by '|'                                                                                                      
    > map keys terminated by ':';
 -- Load the map sample file from the local filesystem into employee_map_data.
 load data local
     inpath 'file:///tmp/hive_class/map_data.csv'
     into table employee_map_data;
    > details["gender"] as employee_gender                                                                                                    
    > from employee_map_data; 
-- Map functions
    > size(details) as size_of_each_map,                                                                                                      
    > map_keys(details) as distinct_map_keys,                                                                                                 
    > map_values(details) as distinct_map_values                                                                                              
    > from employee_map_data; 
-- Assignment dataset: https://www.kaggle.com/datasets/imdevskp/corona-virus-report
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

hive-class-2.txt

Latest commit

History

hive-class-2.txt

File metadata and controls