4 use Text::Unaccent 1.02; # 1.01 won't compile on my platform,
# Open question left by the author: how should the ISIS code page be converted
# to UTF-8?  For now this script uses the ISO-8859-2 mapping table.
#
# Abort immediately if the mapping object cannot be created, and say which
# charset was requested -- $! on its own gives no hint about what failed.
my $isis_map = Unicode::Map8->new('ISO-8859-2')
    or die "cannot load Unicode::Map8 table for ISO-8859-2: $!";
11 <author_swish>Skinner B. F. Skinner B. F. B. F. Skiner </author_swish>
12 <title_swish>Nauka i ljudsko ponasanje B. F. Skiner </title_swish>
13 <headline_swish>Nauka i ljudsko ponasanje B. F. Skiner 1969 </headline_swish>
15 <title_display>Nauka i ljudsko ponašanje / B. F. Skiner</title_display>
16 <headline_display>Nauka i ljudsko ponašanje / B. F. Skiner , 1969</headline_display>
17 <author_display>Skinner, B. F. -- 7oo 'Skinner' 'B. F.'</author_display>
# Sample input: lower-case then upper-case s-caron, d-stroke, c-caron,
# c-acute and z-caron, as ten ISO-8859-2 bytes.  Spelled with hex escapes so
# the value does not depend on the encoding this source file is saved in.
my $test = "\xB9\xF0\xE8\xE6\xBE\xA9\xD0\xC8\xC6\xAE";

# The raw 8-bit sample is not echoed by default; swap the two lines below to
# print it next to its length.
#print "original len: ", length($test), "\t$test\n";
print "original len: ", length($test), "\n";

# Map the 8-bit string to Unicode and serialise the result as UTF-8.
my $tmp = $isis_map->tou($test)->utf8;

print "UTF8 len: ", length($tmp), "\t$tmp\n";
#print "UTF8 len: ", length($tmp), "\n";

# Strip the accents with Text::Unaccent, reading the input as ISO-8859-2.
$tmp = unac_string('ISO-8859-2', $test);
print "unacct_len: ", length($tmp), "\t$tmp\n";
#print "unacct_len: ", length($tmp), "\n";