#!/bin/bash
#
# Writes a summary of the Hive contents visible through beeline to
# /tmp/hive_contents.out. For every table of every database (except
# default.hivesampletable) the following lines are appended:
#
#   <database>.<table>
#   <the " LOCATION '...'" clause taken from SHOW CREATE TABLE, or a blank line>
#   SELECT COUNT(*) FROM <database>.<table>;
#   <sorted output of that COUNT query>
#
# Two helper scripts are downloaded to /tmp and sourced first.
# get_primary_headnode and get_beeline_command_and_kinit are not defined in
# this file; presumably they come from those helpers (verified at runtime
# below before they are called).
#
# Exit status: non-zero if a helper cannot be downloaded or sourced, if a
# required helper function is missing, or if no beeline command is produced.
# Failures of individual beeline queries are not fatal (best effort).

HDINSIGHT_UTILITIES_FNAME='HDInsightUtilities-v01.sh'
HDINSIGHT_UTILITIES="/tmp/$HDINSIGHT_UTILITIES_FNAME"
HIVE_MIGRATION_UTILS_FNAME='hive-migration-utils-v01.sh'
HIVE_MIGRATION_UTILS="/tmp/$HIVE_MIGRATION_UTILS_FNAME"
OUTPUT_FILE='/tmp/hive_contents.out'

# Print a diagnostic to stderr and abort the script.
hc_die() {
  printf 'hive-contents: %s\n' "$*" >&2
  exit 1
}

# Download URL $1 to local path $2; abort when wget reports a failure.
hc_download() {
  local url=$1 dest=$2
  wget -O "$dest" -q "$url" || hc_die "failed to download ${url}"
}

# Run the HiveQL text in $1 through the beeline command held in BEE_CMD.
# BEE_CMD is a complete command *string*, so it has to go through eval.
# CAUTION: $1 is spliced between single quotes; it must not contain a
# single quote. Database/table names are interpolated into it by the
# caller, so this is only safe for identifiers without shell metacharacters.
hc_beeline() {
  eval "$BEE_CMD -e '$1'"
}

# The helpers are sourced at top level (not inside a function) so that any
# `declare`d variables in them stay global.
hc_download \
  "https://hdiconfigactions.blob.core.windows.net/linuxconfigactionmodulev01/${HDINSIGHT_UTILITIES_FNAME}" \
  "$HDINSIGHT_UTILITIES"
# shellcheck source=/dev/null
source "$HDINSIGHT_UTILITIES" || hc_die "failed to source ${HDINSIGHT_UTILITIES}"

hc_download \
  "https://hdiconfigactions.blob.core.windows.net/linuxhivemigrationv01/${HIVE_MIGRATION_UTILS_FNAME}" \
  "$HIVE_MIGRATION_UTILS"
# shellcheck source=/dev/null
source "$HIVE_MIGRATION_UTILS" || hc_die "failed to source ${HIVE_MIGRATION_UTILS}"

# Fail early with a clear message instead of "command not found" later on.
for required_fn in get_primary_headnode get_beeline_command_and_kinit; do
  declare -F "$required_fn" > /dev/null \
    || hc_die "required function ${required_fn} is not defined"
done

PRIMARY_HEADNODE=$(get_primary_headnode)
BEE_CMD=$(get_beeline_command_and_kinit "$PRIMARY_HEADNODE")
[[ -n "$BEE_CMD" ]] || hc_die "could not build the beeline command"

# Start from a clean report; everything below appends to it.
rm -f -- "$OUTPUT_FILE"

# `read -d '' -a` splits on whitespace exactly like an unquoted expansion
# would, but without pathname expansion. It returns non-zero at end of
# input even though the array is filled, hence the `|| true`.
read -r -d '' -a databases <<< "$(hc_beeline 'SHOW DATABASES;' | sort)" || true

for d in "${databases[@]}"; do
  read -r -d '' -a tables <<< "$(hc_beeline "use $d; SHOW TABLES;")" || true

  for t in "${tables[@]}"; do
    # The built-in sample table is deliberately left out of the report.
    [[ "$t" == "hivesampletable" && "$d" == "default" ]] && continue

    # Flatten the DDL onto a single line so the LOCATION clause can be
    # matched with one sed expression.
    flat_ddl=$(
      hc_beeline "use $d; SHOW CREATE TABLE $t;" \
        | tr '\n' ' ' \
        | tr -s ' ' \
        | sed 's/( /(/g'
    )
    # Empty when the DDL has no LOCATION clause (a blank line is written).
    location_clause=$(
      sed -n "s|.*\( LOCATION '[^']*'\).*|\1|p" <<< "$flat_ddl"
    )

    query="SELECT COUNT(*) FROM ${d}.${t}"

    {
      printf '%s\n' "${d}.${t}"
      printf '%s\n' "$location_clause"
      printf '%s\n' "${query};"
      hc_beeline "$query" | sort
    } >> "$OUTPUT_FILE"
  done
done