Hadoop on GCP with Hive
GCP Hadoop Hive Tutorials

This walkthrough provisions a Dataproc cluster backed by a Cloud SQL Hive metastore and a Cloud Storage warehouse bucket, then loads a sample Parquet dataset and queries it with Hive.

Set the region and default zone used throughout the tutorial:

export REGION=us-central1
export ZONE=us-central1-a
gcloud config set compute/zone $ZONE
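
If you want to confirm the active zone before moving on, gcloud can print it back (an optional check, not part of the original steps):

gcloud config get-value compute/zone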

Enable the Dataproc and Cloud SQL Admin APIs:

gcloud services enable dataproc.googleapis.com sqladmin.googleapis.com
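
You can verify that both APIs are active before creating any resources; filtering the enabled-services list with grep is one simple way (optional check):

gcloud services list --enabled | grep -E 'dataproc|sqladmin'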

Capture the project ID and create a Cloud Storage bucket for the Hive warehouse:

export PROJECT=$(gcloud info --format='value(config.project)')
gsutil mb -l $REGION gs://$PROJECT-warehouse
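
A quick way to confirm the bucket exists and landed in the intended region (optional check):

gsutil ls -L -b gs://$PROJECT-warehouse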

Create a Cloud SQL (MySQL) instance to serve as the Hive metastore:

gcloud sql instances create hive-metastore \
    --database-version="MYSQL_5_7" \
    --activation-policy=ALWAYS \
    --gce-zone $ZONE
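
Instance creation can take a few minutes; you can poll its state and proceed once it reports RUNNABLE (optional check):

gcloud sql instances describe hive-metastore --format='value(state)'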

Create a Dataproc cluster that runs the Cloud SQL proxy initialization action, so Hive keeps its metadata in the Cloud SQL instance and its warehouse data in the bucket:

gcloud dataproc clusters create hive-cluster \
    --scopes sql-admin \
    --image-version 1.3 \
    --initialization-actions gs://dataproc-initialization-actions/cloud-sql-proxy/cloud-sql-proxy.sh \
    --properties hive:hive.metastore.warehouse.dir=gs://$PROJECT-warehouse/datasets \
    --metadata "hive-metastore-instance=$PROJECT:$REGION:hive-metastore"
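
If you prefer an interactive session over submitting jobs, you can SSH into the cluster's master node (Dataproc names it hive-cluster-m) and open Beeline against the local HiveServer2; a minimal sketch, assuming the default port 10000:

gcloud compute ssh hive-cluster-m

# then, on the master node:
beeline -u "jdbc:hive2://localhost:10000"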

Copy the sample transactions dataset (Parquet) into the warehouse bucket:

gsutil cp gs://hive-solution/part-00000.parquet \
    gs://$PROJECT-warehouse/datasets/transactions/part-00000.parquet
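
Listing the destination folder confirms the file copied and shows its size (optional check):

gsutil ls -l gs://$PROJECT-warehouse/datasets/transactions/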

Create an external Hive table over the Parquet file:

gcloud dataproc jobs submit hive \
    --cluster hive-cluster \
    --execute "
      CREATE EXTERNAL TABLE transactions
      (SubmissionDate DATE, TransactionAmount DOUBLE, TransactionType STRING)
      STORED AS PARQUET
      LOCATION 'gs://$PROJECT-warehouse/datasets/transactions';"
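
To confirm the table is registered in the Cloud SQL metastore and points at the warehouse bucket, you can describe it (optional check):

gcloud dataproc jobs submit hive \
    --cluster hive-cluster \
    --execute "DESCRIBE FORMATTED transactions;"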

Query the table to confirm the data is readable:

gcloud dataproc jobs submit hive \
    --cluster hive-cluster \
    --execute "SELECT * FROM transactions LIMIT 10;"
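
The same pattern handles aggregations; for example, a per-type summary of the transactions (a sketch reusing the columns defined above):

gcloud dataproc jobs submit hive \
    --cluster hive-cluster \
    --execute "
      SELECT TransactionType,
             COUNT(*) AS NumTransactions,
             AVG(TransactionAmount) AS AvgAmount
      FROM transactions
      GROUP BY TransactionType;"

Because the metastore lives in Cloud SQL, other engines on the cluster see the same table; Spark SQL, for instance, can run a query against it as well (assuming the default Dataproc Spark setup):

gcloud dataproc jobs submit spark-sql \
    --cluster hive-cluster \
    --execute "SELECT COUNT(*) FROM transactions;"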

