Add a script to flatten json files into CSV.

Written to convert Flickr metadata json files into a CSV..
This commit is contained in:
Solomon Peachy 2019-12-14 23:18:16 -05:00
parent 4392a451e3
commit d4123bc61e
1 changed files with 86 additions and 0 deletions

86
json_to_csv.pl Executable file
View File

@ -0,0 +1,86 @@
#!/usr/bin/perl -w
##############################
#
# Quick & Dirty Flickr JSON flattening script
#
# Author: Solomon Peachy <solomon.peachy@philips.com>
#
#############################
use strict;
use JSON;
use utf8;
my $text;
my $doc;
my @flist;
my @database;
my %cols;
binmode STDOUT, ':utf8';
opendir (my $dh, ".") || die;
while (readdir($dh)) {
if (/json/) {
push(@flist, $_);
}
}
foreach my $file (@flist) {
$text = `cat $file`;
$doc = decode_json($text);
my %record;
foreach my $item (keys(%$doc)) {
my $val = $$doc{$item};
if (ref($val) eq "HASH") {
foreach my $subitem (keys(%$val)) {
my $subval = $$val{$subitem};
$cols{"$item-$subitem"} = 1;
$record{"$item-$subitem"} = $subval;
# print "$item-$subitem = $subval\n";
}
} elsif (ref($val) eq "ARRAY") {
my $i = 1;
foreach (@$val) {
my $aval = $$val[$i-1];
if (ref($aval) eq "HASH") {
foreach my $subitem (keys(%$aval)) {
my $subval = $$aval{$subitem};
$cols{"$item-$i-$subitem"} = 1;
$record{"$item-$i-$subitem"} = $subval;
# print "$item-$i-$subitem = $subval\n";
}
} else {
$cols{"$item-$i"} = 1;
$record{"$item-$i"} = $aval;
# print "$item-$i = $aval\n";
}
$i++;
}
} else {
$val =~ tr/\n/ /;
$cols{$item} = 1;
$record{$item} = $val;
# print "$item = $val\n";
}
}
push @database, \%record;
}
#exit(0);
### DONE, emit output.
foreach (sort(keys(%cols))) {
print "\"$_\",";
}
print "\n";
foreach my $row (@database) {
foreach (sort(keys(%cols))) {
if (defined($$row{$_})) {
print "\"$$row{$_}\",";
} else {
print ",";
}
}
print "\n";
};