-
Notifications
You must be signed in to change notification settings - Fork 1k
/
hive_foreach_table.sh
executable file
·71 lines (51 loc) · 2.09 KB
/
hive_foreach_table.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
#!/usr/bin/env bash
# vim:ts=4:sts=4:sw=4:et
#
# Author: Hari Sekhon
# Date: 2019-12-06 11:10:26 +0000 (Fri, 06 Dec 2019)
#
# https://github.com/HariSekhon/DevOps-Bash-tools
#
# License: see accompanying Hari Sekhon LICENSE file
#
# If you're using my code you're welcome to connect with me on LinkedIn and optionally send me feedback to help steer this or other code I publish
#
# https://www.linkedin.com/in/HariSekhon
#
set -euo pipefail
[ -n "${DEBUG:-}" ] && set -x
srcdir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
# shellcheck disable=SC1090,SC1091
. "$srcdir/lib/utils.sh"
# shellcheck disable=SC2034,SC2154
usage_description="
Run SQL query against all Hive tables in all databases via beeline
Query can contain {db} and {table} placeholders which will be replaced for each table
FILTER environment variable will restrict to matching fully qualified tables (<db>.<table>)
WARNING: do not run any subshell command reading from standard input, otherwise it will consume the db/table names and exit after the first iteration
Tested on Hive 1.1.0 on CDH 5.10, 5.16
For a better version written in Python see DevOps Python tools repo:
https://github.com/HariSekhon/DevOps-Python-tools
you will need to comment out / remove the 'set -o pipefail' to skip errors if you aren't authorized to use
any of the databases to avoid the script exiting early upon encountering any authorization error such:
ERROR: AuthorizationException: User '<user>@<domain>' does not have privileges to access: default Default Hive database.*.*
"
# used by usage() in lib/utils.sh
# shellcheck disable=SC2034
usage_args="\"<query>\" [<beeline_options>]"
help_usage "$@"
min_args 1 "$@"
query_template="$1"
shift || :
opts="--silent=true --outputformat=tsv2"
# exit the loop subshell if you Control-C
trap 'exit 130' INT
# shellcheck disable=SC2086
"$srcdir/hive_list_tables.sh" "$@" |
while read -r db table; do
printf '%s.%s\t' "$db" "$table"
query="${query_template//\{db\}/\`$db\`}"
query="${query//\{table\}/\`$table\`}"
"$srcdir/beeline.sh" $opts -e "USE \`$db\`; $query" "$@" |
tail -n +2
done