forked from apache/hive
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdump_schema
executable file
·71 lines (67 loc) · 1.97 KB
/
dump_schema
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
#! /usr/bin/perl -w
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
use strict;
use Data::Dumper;
# Lower-case names of the types that get_cols prints as leaves instead of
# describing further; membership is tested with lc() of the type name.
my %primitive = map { $_ => 1 } qw(int byte string float long);
# Run "describe <col>;" through the Hive CLI and return the cleaned-up rows.
#
# Arguments:
#   $col - name of the table, or dotted column path, to describe.
#
# Returns one string per CLI output line that contained a '|' character, with
# every '|' removed, leading/trailing whitespace trimmed and inner whitespace
# runs collapsed to a single space. Rows that are empty after that clean-up
# are dropped, since they carry neither a name nor a type. The list is empty
# when the command produces no matching line.
sub get_hive_cols($)
{
    my $col = shift;

    # The name sits inside a single-quoted shell word, so a literal single
    # quote must be spelled '\'' or it would terminate the quoting early and
    # let the rest of the name be interpreted by the shell.
    (my $quoted = $col) =~ s/'/'\\''/g;
    my $cmd = "echo 'describe $quoted;' | /mnt/vol/hive/stable/bin/hive_cli.py | grep '|'";
    #print "$cmd\n";
    my @cols = `$cmd`;

    # $row aliases each element, so the array is cleaned in place.
    for my $row (@cols) {
        $row =~ s/\|//g;
        $row =~ s/^\s+//;
        $row =~ s/\s+$//;    # also strips the trailing newline
        $row =~ s/\s+/ /g;
    }
    #print Dumper(\@cols);
    return grep { length } @cols;
}
# Print the type tree of a table or column to STDOUT, recursing into every
# non-primitive member.
#
# Arguments:
#   $msg - indentation prefix written in front of every line of this level.
#   $c   - dotted path of the item; this is what gets described.
#   $t   - type name of the item.
#
# A type listed in %primitive (compared lower-cased), or a "List<X>" whose X
# is listed there, is printed as a single "type:path" line. Any other type is
# printed as "type {" ... "}//type", with one recursive call per row returned
# by get_hive_cols, indented by one more tab.
#
# Dies with "no cols!" when get_hive_cols returns nothing for $c.
sub get_cols($$$)
{
    my ($msg, $c, $t) = @_;

    # Leaf: a primitive, or a list of primitives.
    if ($primitive{lc($t)} or ($t =~ /List<(.*?)>/ and $primitive{lc($1)})) {
        print "${msg}${t}:${c}\n";
        return;
    }

    my @fields = get_hive_cols($c);
    @fields or die "no cols!";

    print "${msg}${t} {\n";
    for my $field (@fields) {
        # The first two whitespace-separated words of a row are name and type.
        my ($name, $type) = split ' ', $field;
        # The & form is kept on purpose: inside its own body the prototype of
        # get_cols is not in effect yet, and a plain call would make perl -w
        # warn that the sub was called too early to check its prototype.
        &get_cols("$msg\t", "$c.$name", $type);
    }
    print "${msg}}//${t}\n";
}
# Script body: print the schema tree for the name given as the first
# command-line argument. If that attempt dies for any reason, the error is
# deliberately discarded and the entries of the CLI's "show" output that match
# the argument are printed instead, sorted.
#die "Usage: dump_schema tableName\n" unless @ARGV;
my $tablename = $ARGV[0];
# With no (or an empty) argument use ".", which as a grep pattern matches
# every non-empty name. Tested with defined/length so that a literal "0" is
# still treated as a name.
$tablename = "." unless defined $tablename and length $tablename;
eval {
    get_cols("", $tablename, $tablename);
};
if ($@) {
    # The argument comes straight from the command line: wrap it in single
    # quotes (spelling embedded quotes as '\'') so the shell cannot interpret
    # it, and pass it with -e so a leading '-' is not taken as a grep option.
    (my $pattern = $tablename) =~ s/'/'\\''/g;
    my $cmd = "echo show | /mnt/vol/hive/stable/bin/hive_cli.py | grep '|' | tr '|' '\\n' | awk '{print \$1}' | grep -v ^\$ | grep -e '$pattern' | sort";
    my @tables = `$cmd`;
    print @tables;
}