projects
/
eprints3-migration.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
| inline |
side by side
(parent:
0a3f750
)
eprints-dev: /home/dpavlin/mtoolkit/utf8-fix.pl [commit]
author
Dobrica Pavlinusic
<dpavlin@rot13.org>
Tue, 19 Oct 2010 00:20:03 +0000
(
02:20
+0200)
committer
Dobrica Pavlinusic
<dpavlin@rot13.org>
Tue, 19 Oct 2010 00:20:03 +0000
(
02:20
+0200)
mtoolkit/utf8-fix.pl
patch
|
blob
|
history
diff --git
a/mtoolkit/utf8-fix.pl
b/mtoolkit/utf8-fix.pl
index
f78aa3c
..
3946bcd
100755
(executable)
--- a/
mtoolkit/utf8-fix.pl
+++ b/
mtoolkit/utf8-fix.pl
@@
-64,6
+64,8
@@
s/$junk\xC2\xAD/-/gs && $stat->{'-'}++;
s/$junk\xC2\x80\xC2\x9C/-/gs && $stat->{'--'}++;
s/$junk\xC2\x9D/-/gs && $stat->{'-- ?'}++;
+s/$junk\xC3\x82\xC2\xA2/- /gs && $stat->{'dot'}++;
+
my $e = $_;
if ( $e =~ m/([\xC0-\xC4][\x80-\xff]{4,8})/s ) {