### 1. Create database ``` CREATE DATABASE my_delta_db; ``` ### 2. Create table
DROP TABLE IF EXISTS my_delta_db.delta_trip_table; CREATE EXTERNAL TABLE my_delta_db.delta_trip_table ( destination string, trip_id bigint, tstamp string, origin string ) PARTITIONED BY (route_id string) ROW FORMAT SERDE 'org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe' STORED AS INPUTFORMAT 'org.apache.hadoop.hive.ql.io.SymlinkTextInputFormat' OUTPUTFORMAT 'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat' LOCATION 's3://your-s3-location-for-delta-hive-table/_symlink_format_manifest/';### 3. Repair partitions ``` MSCK REPAIR TABLE my_delta_db.delta_trip_table; ``` ### 4. Others ``` SELECT count(*) FROM my_delta_db.delta_trip_table; SELECT max(trip_id) FROM my_delta_db.delta_trip_table; SELECT DISTINCT destination from my_delta_db.delta_trip_table ORDER BY destination; SELECT destination, route_id, trip_id, tstamp FROM my_delta_db.delta_trip_table LIMIT 10; SELECT DISTINCT route_id from my_delta_db.delta_trip_table ORDER BY route_id; SELECT * FROM my_delta_db.delta_trip_table WHERE trip_id > 1999996 ORDER BY trip_id; SELECT count(*) AS Count_Syracuse FROM my_delta_db.delta_trip_table WHERE destination = 'Syracuse'; SELECT count(*) AS Count_Philadelphia FROM my_delta_db.delta_trip_table WHERE destination = 'Philadelphia'; SELECT count(*) as Count_total FROM my_delta_db.delta_trip_table; SELECT count(*) as Count_NJ FROM my_delta_db.delta_trip_table WHERE destination = 'New Jersey'; ```