From 9111b560f15f9a9cf366e0426107d6cdef0360bb Mon Sep 17 00:00:00 2001 From: Dobrica Pavlinusic Date: Tue, 19 Oct 2010 18:19:52 +0200 Subject: [PATCH] eprints-dev: /home/dpavlin/mtoolkit/utf8-fix.pl [commit] --- mtoolkit/utf8-fix.pl | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/mtoolkit/utf8-fix.pl b/mtoolkit/utf8-fix.pl index 3946bcd..3592209 100755 --- a/mtoolkit/utf8-fix.pl +++ b/mtoolkit/utf8-fix.pl @@ -67,8 +67,9 @@ s/$junk\xC2\x9D/-/gs && $stat->{'-- ?'}++; s/$junk\xC3\x82\xC2\xA2/- /gs && $stat->{'dot'}++; + my $e = $_; - if ( $e =~ m/([\xC0-\xC4][\x80-\xff]{4,8})/s ) { + if ( $e =~ m/([\xC0-\xC4][\x80-\xff]{3,99})/s ) { warn "XXX ", dump($e), "\n$e\n"; } print $e; -- 2.20.1