From 9f2251d20b2951b0559df175e1a6051990ab528c Mon Sep 17 00:00:00 2001
From: Dobrica Pavlinusic
Date: Sat, 5 Jun 2010 15:54:12 +0200
Subject: [PATCH] __normalize_header to cleanup names

---
NOTE(review): line breaks, tab indentation and blank context lines below were
reconstructed from a flattened copy of this patch; re-export it with
git format-patch from the repository before relying on it to apply cleanly.

 lib/MojoFacets/Import/HTMLTable.pm | 17 +++++++++++++----
 1 file changed, 13 insertions(+), 4 deletions(-)

diff --git a/lib/MojoFacets/Import/HTMLTable.pm b/lib/MojoFacets/Import/HTMLTable.pm
index 22aea57..25c6406 100644
--- a/lib/MojoFacets/Import/HTMLTable.pm
+++ b/lib/MojoFacets/Import/HTMLTable.pm
@@ -11,6 +11,15 @@ use Data::Dump qw(dump);
 
 __PACKAGE__->attr('dir');
 
+sub __normalize_header {
+	map {
+		s/^\s+//s;
+		s/\s+$//s;
+		s/\s\s+/ /gs;
+		$_;
+	} @_
+}
+
 sub data {
 	my $self = shift;
 
@@ -36,12 +45,12 @@ sub data {
 			warn "# row ", dump( $row ),"\n";
 			if ( ! $stats->{$file} ) {
 				if ( ! @header ) {
-					@header = @$row;
+					@header = __normalize_header( @$row );
 					warn "# new header ",dump(@header);
 					$row = undef;
 				} else {
 					my $o = join('|', @header);
-					my $n = join('|', @$row);
+					my $n = join('|', __normalize_header(@$row));
 					if ( $o eq $n ) {
 						warn "# same header again in $file skipping\n";
 						$row = undef;
@@ -56,10 +65,10 @@ sub data {
 				foreach my $i ( 0 .. $#$row ) {
 					$item->{ $header[$i] } = [ $row->[$i] ];
 				}
-				warn "## item ",dump($item);
+				$stats->{$file}++;
+				warn "## item ",$stats->{$file}, ' ', dump($item);
 				push @$items, $item;
 
-				$stats->{$file}++;
 			}
 		}
 	}
-- 
2.20.1