#!/usr/bin/env bash # vim:ts=4:sts=4:sw=4:et # # Author: Hari Sekhon # Date: 2019-12-10 11:33:52 +0000 (Tue, 10 Dec 2019) # # https://github.com/harisekhon/bash-tools # # License: see accompanying Hari Sekhon LICENSE file # # If you're using my code you're welcome to connect with me on LinkedIn and optionally send me feedback to help steer this or other code I publish # # https://www.linkedin.com/in/harisekhon # set -euo pipefail [ -n "${DEBUG:-}" ] && set -x srcdir="$(dirname "${BASH_SOURCE[0]}")" # shellcheck disable=SC1090 . "$srcdir/lib/utils.sh" # shellcheck disable=SC2034,SC2154 usage_description=" Lists all Impala tables in all databases using adjacent impala_shell.sh script FILTER environment variable will restrict to matching fully qualified tables (.) Tested on Impala 2.7.0, 2.12.0 on CDH 5.10, 5.16 with Kerberos and SSL For more documentation see the comments at the top of impala_shell.sh For a better version written in Python see DevOps Python tools repo: https://github.com/harisekhon/devops-python-tools you will need to comment out / remove 'set -o pipefail' below to skip errors if you aren't authorized to use any of the databases to avoid the script exiting early upon encountering any authorization error such: ERROR: AuthorizationException: User '@' does not have privileges to access: default Default Hive database.*.* " # used by usage() in lib/utils.sh # shellcheck disable=SC2034 usage_args="[]" help_usage "$@" "$srcdir/impala_list_databases.sh" | while read -r db; do "$srcdir/impala_shell.sh" --quiet -Bq "SHOW TABLES IN \`$db\`" "$@" | sed "s/^/$db /" done | while read -r db table; do if [ -n "${FILTER:-}" ] && ! [[ "$db.$table" =~ $FILTER ]]; then continue fi printf '%s\t%s\n' "$db" "$table" done