added configuration for PerlMonks XML dump indexing
git-svn-id: svn+ssh://mjesec/home/dpavlin/svn/webpac2/trunk@991 07558da8-63fa-0310-ba24-9fe276d99e06
- name: xml
module: 'WebPAC::Input::XML'
path: '/home/dpavlin/monk-search/xml-dump'
+ mungle: 'conf/mungle/perlmonks-xml.pl'
normalize:
- path: 'conf/normalize/perlmonks.pl'
+ path: 'conf/normalize/perlmonks.pl'
output:
- module: 'KinoSearch'
path: 'var/kinosearch'
--- /dev/null
+# special mungle file which prepares data_structure from XML
+
+my $h = get_ds->{node};  # work on the 'node' entry of what get_ds returns (presumably the parsed XML record -- confirm)
+warn "## $0 hash to work on = ",dump( $h );  # debug trace on STDERR: script name ($0) followed by dump() of $h
+
+set_ds(  # hand a flat key => value list to set_ds; NOTE(review): presumably this replaces the record's data structure -- confirm
+ Title => $h->{title},  # read directly from the node hash
+ Author => $h->{author}->{content},  # author is a nested hash; its value is under 'content'
+ Date => $h->{created},  # read directly from the node hash
+ Content => $h->{doctext}->{content},  # doctext is a nested hash; its value is under 'content'
+ Type => $h->{type}->{content},  # type is a nested hash; its value is under 'content'
+);
+
+
--- /dev/null
+# For each field name listed below (aliased to $_), call search_display( name, rec( name ) ).
+search_display( $_, rec( $_ ) ) foreach ( qw/
+Title
+Author
+Date
+Content
+Type
+/ );  # NOTE(review): rec() and search_display() are defined elsewhere; presumably rec() returns the field's value(s) -- confirm
+